Diff of the two buildlogs: -- --- b1/build.log 2024-03-16 20:04:32.902484863 +0000 +++ b2/build.log 2024-03-16 21:02:40.569975787 +0000 @@ -1,6 +1,6 @@ I: pbuilder: network access will be disabled during build -I: Current time: Sat Mar 16 07:28:24 -12 2024 -I: pbuilder-time-stamp: 1710617304 +I: Current time: Sun Mar 17 10:05:06 +14 2024 +I: pbuilder-time-stamp: 1710619506 I: Building the build Environment I: extracting base tarball [/var/cache/pbuilder/bookworm-reproducible-base.tgz] I: copying local configuration @@ -16,7 +16,7 @@ I: copying [./librsb_1.3.0.2+dfsg.orig.tar.xz] I: copying [./librsb_1.3.0.2+dfsg-4.debian.tar.xz] I: Extracting source -gpgv: Signature made Fri Feb 17 19:00:35 2023 -12 +gpgv: Signature made Sat Feb 18 21:00:35 2023 +14 gpgv: using RSA key 3F464391498FE874BDB5D98F2124AA1983785C90 gpgv: issuer "rafael@debian.org" gpgv: Can't check signature: No public key @@ -28,135 +28,167 @@ dpkg-source: info: applying auto-gitignore I: Not using root during the build. I: Installing the build-deps -I: user script /srv/workspace/pbuilder/21297/tmp/hooks/D02_print_environment starting +I: user script /srv/workspace/pbuilder/10894/tmp/hooks/D01_modify_environment starting +debug: Running on virt32c. +I: Changing host+domainname to test build reproducibility +I: Adding a custom variable just for the fun of it... +I: Changing /bin/sh to bash +'/bin/sh' -> '/bin/bash' +lrwxrwxrwx 1 root root 9 Mar 17 10:05 /bin/sh -> /bin/bash +I: Setting pbuilder2's login shell to /bin/bash +I: Setting pbuilder2's GECOS to second user,second room,second work-phone,second home-phone,second other +I: user script /srv/workspace/pbuilder/10894/tmp/hooks/D01_modify_environment finished +I: user script /srv/workspace/pbuilder/10894/tmp/hooks/D02_print_environment starting I: set - BUILDDIR='/build/reproducible-path' - BUILDUSERGECOS='first user,first room,first work-phone,first home-phone,first other' - BUILDUSERNAME='pbuilder1' - BUILD_ARCH='armhf' - DEBIAN_FRONTEND='noninteractive' - DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=3 ' - DISTRIBUTION='bookworm' - HOME='/root' - HOST_ARCH='armhf' + BASH=/bin/sh + BASHOPTS=checkwinsize:cmdhist:complete_fullquote:extquote:force_fignore:globasciiranges:globskipdots:hostcomplete:interactive_comments:patsub_replacement:progcomp:promptvars:sourcepath + BASH_ALIASES=() + BASH_ARGC=() + BASH_ARGV=() + BASH_CMDS=() + BASH_LINENO=([0]="12" [1]="0") + BASH_LOADABLES_PATH=/usr/local/lib/bash:/usr/lib/bash:/opt/local/lib/bash:/usr/pkg/lib/bash:/opt/pkg/lib/bash:. + BASH_SOURCE=([0]="/tmp/hooks/D02_print_environment" [1]="/tmp/hooks/D02_print_environment") + BASH_VERSINFO=([0]="5" [1]="2" [2]="15" [3]="1" [4]="release" [5]="arm-unknown-linux-gnueabihf") + BASH_VERSION='5.2.15(1)-release' + BUILDDIR=/build/reproducible-path + BUILDUSERGECOS='second user,second room,second work-phone,second home-phone,second other' + BUILDUSERNAME=pbuilder2 + BUILD_ARCH=armhf + DEBIAN_FRONTEND=noninteractive + DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=4 ' + DIRSTACK=() + DISTRIBUTION=bookworm + EUID=0 + FUNCNAME=([0]="Echo" [1]="main") + GROUPS=() + HOME=/root + HOSTNAME=i-capture-the-hostname + HOSTTYPE=arm + HOST_ARCH=armhf IFS=' ' - INVOCATION_ID='c6d6a7d74f8b4ec4ad3cd7103020ce76' - LANG='C' - LANGUAGE='en_US:en' - LC_ALL='C' - MAIL='/var/mail/root' - OPTIND='1' - PATH='/usr/sbin:/usr/bin:/sbin:/bin:/usr/games' - PBCURRENTCOMMANDLINEOPERATION='build' - PBUILDER_OPERATION='build' - PBUILDER_PKGDATADIR='/usr/share/pbuilder' - PBUILDER_PKGLIBDIR='/usr/lib/pbuilder' - PBUILDER_SYSCONFDIR='/etc' - PPID='21297' - PS1='# ' - PS2='> ' + INVOCATION_ID=4c4406c4e63d4cfca8b55353aa923c98 + LANG=C + LANGUAGE=it_CH:it + LC_ALL=C + MACHTYPE=arm-unknown-linux-gnueabihf + MAIL=/var/mail/root + OPTERR=1 + OPTIND=1 + OSTYPE=linux-gnueabihf + PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path + PBCURRENTCOMMANDLINEOPERATION=build + PBUILDER_OPERATION=build + PBUILDER_PKGDATADIR=/usr/share/pbuilder + PBUILDER_PKGLIBDIR=/usr/lib/pbuilder + PBUILDER_SYSCONFDIR=/etc + PIPESTATUS=([0]="0") + POSIXLY_CORRECT=y + PPID=10894 PS4='+ ' - PWD='/' - SHELL='/bin/bash' - SHLVL='2' - SUDO_COMMAND='/usr/bin/timeout -k 18.1h 18h /usr/bin/ionice -c 3 /usr/bin/nice /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.UWWiF9pB/pbuilderrc_GgQ9 --distribution bookworm --hookdir /etc/pbuilder/first-build-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/bookworm-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.UWWiF9pB/b1 --logfile b1/build.log librsb_1.3.0.2+dfsg-4.dsc' - SUDO_GID='113' - SUDO_UID='107' - SUDO_USER='jenkins' - TERM='unknown' - TZ='/usr/share/zoneinfo/Etc/GMT+12' - USER='root' - _='/usr/bin/systemd-run' - http_proxy='http://10.0.0.15:3142/' + PWD=/ + SHELL=/bin/bash + SHELLOPTS=braceexpand:errexit:hashall:interactive-comments:posix + SHLVL=3 + SUDO_COMMAND='/usr/bin/timeout -k 24.1h 24h /usr/bin/ionice -c 3 /usr/bin/nice -n 11 /usr/bin/unshare --uts -- /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.UWWiF9pB/pbuilderrc_lwLu --distribution bookworm --hookdir /etc/pbuilder/rebuild-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/bookworm-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.UWWiF9pB/b2 --logfile b2/build.log librsb_1.3.0.2+dfsg-4.dsc' + SUDO_GID=113 + SUDO_UID=107 + SUDO_USER=jenkins + TERM=unknown + TZ=/usr/share/zoneinfo/Etc/GMT-14 + UID=0 + USER=root + _='I: set' + http_proxy=http://10.0.0.15:3142/ I: uname -a - Linux virt64c 6.1.0-18-arm64 #1 SMP Debian 6.1.76-1 (2024-02-01) aarch64 GNU/Linux + Linux i-capture-the-hostname 6.1.0-18-armmp-lpae #1 SMP Debian 6.1.76-1 (2024-02-01) armv7l GNU/Linux I: ls -l /bin - total 4964 - -rwxr-xr-x 1 root root 838488 Apr 23 2023 bash - -rwxr-xr-x 3 root root 67144 Sep 18 2022 bunzip2 - -rwxr-xr-x 3 root root 67144 Sep 18 2022 bzcat - lrwxrwxrwx 1 root root 6 Sep 18 2022 bzcmp -> bzdiff - -rwxr-xr-x 1 root root 2225 Sep 18 2022 bzdiff - lrwxrwxrwx 1 root root 6 Sep 18 2022 bzegrep -> bzgrep - -rwxr-xr-x 1 root root 4893 Nov 27 2021 bzexe - lrwxrwxrwx 1 root root 6 Sep 18 2022 bzfgrep -> bzgrep - -rwxr-xr-x 1 root root 3775 Sep 18 2022 bzgrep - -rwxr-xr-x 3 root root 67144 Sep 18 2022 bzip2 - -rwxr-xr-x 1 root root 67112 Sep 18 2022 bzip2recover - lrwxrwxrwx 1 root root 6 Sep 18 2022 bzless -> bzmore - -rwxr-xr-x 1 root root 1297 Sep 18 2022 bzmore - -rwxr-xr-x 1 root root 67632 Sep 20 2022 cat - -rwxr-xr-x 1 root root 67676 Sep 20 2022 chgrp - -rwxr-xr-x 1 root root 67644 Sep 20 2022 chmod - -rwxr-xr-x 1 root root 67684 Sep 20 2022 chown - -rwxr-xr-x 1 root root 133532 Sep 20 2022 cp - -rwxr-xr-x 1 root root 132868 Jan 5 2023 dash - -rwxr-xr-x 1 root root 133220 Sep 20 2022 date - -rwxr-xr-x 1 root root 67732 Sep 20 2022 dd - -rwxr-xr-x 1 root root 68104 Sep 20 2022 df - -rwxr-xr-x 1 root root 133632 Sep 20 2022 dir - -rwxr-xr-x 1 root root 59128 Mar 22 2023 dmesg - lrwxrwxrwx 1 root root 8 Dec 19 2022 dnsdomainname -> hostname - lrwxrwxrwx 1 root root 8 Dec 19 2022 domainname -> hostname - -rwxr-xr-x 1 root root 67560 Sep 20 2022 echo - -rwxr-xr-x 1 root root 41 Jan 24 2023 egrep - -rwxr-xr-x 1 root root 67548 Sep 20 2022 false - -rwxr-xr-x 1 root root 41 Jan 24 2023 fgrep - -rwxr-xr-x 1 root root 55748 Mar 22 2023 findmnt - -rwsr-xr-x 1 root root 26208 Mar 22 2023 fusermount - -rwxr-xr-x 1 root root 128608 Jan 24 2023 grep - -rwxr-xr-x 2 root root 2346 Apr 9 2022 gunzip - -rwxr-xr-x 1 root root 6447 Apr 9 2022 gzexe - -rwxr-xr-x 1 root root 64220 Apr 9 2022 gzip - -rwxr-xr-x 1 root root 67032 Dec 19 2022 hostname - -rwxr-xr-x 1 root root 67720 Sep 20 2022 ln - -rwxr-xr-x 1 root root 35132 Mar 22 2023 login - -rwxr-xr-x 1 root root 133632 Sep 20 2022 ls - -rwxr-xr-x 1 root root 136808 Mar 22 2023 lsblk - -rwxr-xr-x 1 root root 67800 Sep 20 2022 mkdir - -rwxr-xr-x 1 root root 67764 Sep 20 2022 mknod - -rwxr-xr-x 1 root root 67596 Sep 20 2022 mktemp - -rwxr-xr-x 1 root root 38504 Mar 22 2023 more - -rwsr-xr-x 1 root root 38496 Mar 22 2023 mount - -rwxr-xr-x 1 root root 9824 Mar 22 2023 mountpoint - -rwxr-xr-x 1 root root 133532 Sep 20 2022 mv - lrwxrwxrwx 1 root root 8 Dec 19 2022 nisdomainname -> hostname - lrwxrwxrwx 1 root root 14 Apr 2 2023 pidof -> /sbin/killall5 - -rwxr-xr-x 1 root root 67608 Sep 20 2022 pwd - lrwxrwxrwx 1 root root 4 Apr 23 2023 rbash -> bash - -rwxr-xr-x 1 root root 67600 Sep 20 2022 readlink - -rwxr-xr-x 1 root root 67672 Sep 20 2022 rm - -rwxr-xr-x 1 root root 67600 Sep 20 2022 rmdir - -rwxr-xr-x 1 root root 14152 Jul 28 2023 run-parts - -rwxr-xr-x 1 root root 133372 Jan 5 2023 sed - lrwxrwxrwx 1 root root 4 Jan 5 2023 sh -> dash - -rwxr-xr-x 1 root root 67584 Sep 20 2022 sleep - -rwxr-xr-x 1 root root 67644 Sep 20 2022 stty - -rwsr-xr-x 1 root root 50800 Mar 22 2023 su - -rwxr-xr-x 1 root root 67584 Sep 20 2022 sync - -rwxr-xr-x 1 root root 336764 Jan 19 21:27 tar - -rwxr-xr-x 1 root root 9800 Jul 28 2023 tempfile - -rwxr-xr-x 1 root root 133224 Sep 20 2022 touch - -rwxr-xr-x 1 root root 67548 Sep 20 2022 true - -rwxr-xr-x 1 root root 9768 Mar 22 2023 ulockmgr_server - -rwsr-xr-x 1 root root 22108 Mar 22 2023 umount - -rwxr-xr-x 1 root root 67572 Sep 20 2022 uname - -rwxr-xr-x 2 root root 2346 Apr 9 2022 uncompress - -rwxr-xr-x 1 root root 133632 Sep 20 2022 vdir - -rwxr-xr-x 1 root root 42608 Mar 22 2023 wdctl - lrwxrwxrwx 1 root root 8 Dec 19 2022 ypdomainname -> hostname - -rwxr-xr-x 1 root root 1984 Apr 9 2022 zcat - -rwxr-xr-x 1 root root 1678 Apr 9 2022 zcmp - -rwxr-xr-x 1 root root 6460 Apr 9 2022 zdiff - -rwxr-xr-x 1 root root 29 Apr 9 2022 zegrep - -rwxr-xr-x 1 root root 29 Apr 9 2022 zfgrep - -rwxr-xr-x 1 root root 2081 Apr 9 2022 zforce - -rwxr-xr-x 1 root root 8103 Apr 9 2022 zgrep - -rwxr-xr-x 1 root root 2206 Apr 9 2022 zless - -rwxr-xr-x 1 root root 1842 Apr 9 2022 zmore - -rwxr-xr-x 1 root root 4577 Apr 9 2022 znew -I: user script /srv/workspace/pbuilder/21297/tmp/hooks/D02_print_environment finished + total 4996 + -rwxr-xr-x 1 root root 838488 Apr 24 2023 bash + -rwxr-xr-x 3 root root 67144 Sep 19 2022 bunzip2 + -rwxr-xr-x 3 root root 67144 Sep 19 2022 bzcat + lrwxrwxrwx 1 root root 6 Sep 19 2022 bzcmp -> bzdiff + -rwxr-xr-x 1 root root 2225 Sep 19 2022 bzdiff + lrwxrwxrwx 1 root root 6 Sep 19 2022 bzegrep -> bzgrep + -rwxr-xr-x 1 root root 4893 Nov 28 2021 bzexe + lrwxrwxrwx 1 root root 6 Sep 19 2022 bzfgrep -> bzgrep + -rwxr-xr-x 1 root root 3775 Sep 19 2022 bzgrep + -rwxr-xr-x 3 root root 67144 Sep 19 2022 bzip2 + -rwxr-xr-x 1 root root 67112 Sep 19 2022 bzip2recover + lrwxrwxrwx 1 root root 6 Sep 19 2022 bzless -> bzmore + -rwxr-xr-x 1 root root 1297 Sep 19 2022 bzmore + -rwxr-xr-x 1 root root 67632 Sep 21 2022 cat + -rwxr-xr-x 1 root root 67676 Sep 21 2022 chgrp + -rwxr-xr-x 1 root root 67644 Sep 21 2022 chmod + -rwxr-xr-x 1 root root 67684 Sep 21 2022 chown + -rwxr-xr-x 1 root root 133532 Sep 21 2022 cp + -rwxr-xr-x 1 root root 132868 Jan 6 2023 dash + -rwxr-xr-x 1 root root 133220 Sep 21 2022 date + -rwxr-xr-x 1 root root 67732 Sep 21 2022 dd + -rwxr-xr-x 1 root root 68104 Sep 21 2022 df + -rwxr-xr-x 1 root root 133632 Sep 21 2022 dir + -rwxr-xr-x 1 root root 59128 Mar 23 2023 dmesg + lrwxrwxrwx 1 root root 8 Dec 20 2022 dnsdomainname -> hostname + lrwxrwxrwx 1 root root 8 Dec 20 2022 domainname -> hostname + -rwxr-xr-x 1 root root 67560 Sep 21 2022 echo + -rwxr-xr-x 1 root root 41 Jan 25 2023 egrep + -rwxr-xr-x 1 root root 67548 Sep 21 2022 false + -rwxr-xr-x 1 root root 41 Jan 25 2023 fgrep + -rwxr-xr-x 1 root root 55748 Mar 23 2023 findmnt + -rwsr-xr-x 1 root root 26208 Mar 23 2023 fusermount + -rwxr-xr-x 1 root root 128608 Jan 25 2023 grep + -rwxr-xr-x 2 root root 2346 Apr 10 2022 gunzip + -rwxr-xr-x 1 root root 6447 Apr 10 2022 gzexe + -rwxr-xr-x 1 root root 64220 Apr 10 2022 gzip + -rwxr-xr-x 1 root root 67032 Dec 20 2022 hostname + -rwxr-xr-x 1 root root 67720 Sep 21 2022 ln + -rwxr-xr-x 1 root root 35132 Mar 23 2023 login + -rwxr-xr-x 1 root root 133632 Sep 21 2022 ls + -rwxr-xr-x 1 root root 136808 Mar 23 2023 lsblk + -rwxr-xr-x 1 root root 67800 Sep 21 2022 mkdir + -rwxr-xr-x 1 root root 67764 Sep 21 2022 mknod + -rwxr-xr-x 1 root root 67596 Sep 21 2022 mktemp + -rwxr-xr-x 1 root root 38504 Mar 23 2023 more + -rwsr-xr-x 1 root root 38496 Mar 23 2023 mount + -rwxr-xr-x 1 root root 9824 Mar 23 2023 mountpoint + -rwxr-xr-x 1 root root 133532 Sep 21 2022 mv + lrwxrwxrwx 1 root root 8 Dec 20 2022 nisdomainname -> hostname + lrwxrwxrwx 1 root root 14 Apr 3 2023 pidof -> /sbin/killall5 + -rwxr-xr-x 1 root root 67608 Sep 21 2022 pwd + lrwxrwxrwx 1 root root 4 Apr 24 2023 rbash -> bash + -rwxr-xr-x 1 root root 67600 Sep 21 2022 readlink + -rwxr-xr-x 1 root root 67672 Sep 21 2022 rm + -rwxr-xr-x 1 root root 67600 Sep 21 2022 rmdir + -rwxr-xr-x 1 root root 14152 Jul 29 2023 run-parts + -rwxr-xr-x 1 root root 133372 Jan 6 2023 sed + lrwxrwxrwx 1 root root 9 Mar 17 10:05 sh -> /bin/bash + -rwxr-xr-x 1 root root 67584 Sep 21 2022 sleep + -rwxr-xr-x 1 root root 67644 Sep 21 2022 stty + -rwsr-xr-x 1 root root 50800 Mar 23 2023 su + -rwxr-xr-x 1 root root 67584 Sep 21 2022 sync + -rwxr-xr-x 1 root root 336764 Jan 20 23:27 tar + -rwxr-xr-x 1 root root 9800 Jul 29 2023 tempfile + -rwxr-xr-x 1 root root 133224 Sep 21 2022 touch + -rwxr-xr-x 1 root root 67548 Sep 21 2022 true + -rwxr-xr-x 1 root root 9768 Mar 23 2023 ulockmgr_server + -rwsr-xr-x 1 root root 22108 Mar 23 2023 umount + -rwxr-xr-x 1 root root 67572 Sep 21 2022 uname + -rwxr-xr-x 2 root root 2346 Apr 10 2022 uncompress + -rwxr-xr-x 1 root root 133632 Sep 21 2022 vdir + -rwxr-xr-x 1 root root 42608 Mar 23 2023 wdctl + lrwxrwxrwx 1 root root 8 Dec 20 2022 ypdomainname -> hostname + -rwxr-xr-x 1 root root 1984 Apr 10 2022 zcat + -rwxr-xr-x 1 root root 1678 Apr 10 2022 zcmp + -rwxr-xr-x 1 root root 6460 Apr 10 2022 zdiff + -rwxr-xr-x 1 root root 29 Apr 10 2022 zegrep + -rwxr-xr-x 1 root root 29 Apr 10 2022 zfgrep + -rwxr-xr-x 1 root root 2081 Apr 10 2022 zforce + -rwxr-xr-x 1 root root 8103 Apr 10 2022 zgrep + -rwxr-xr-x 1 root root 2206 Apr 10 2022 zless + -rwxr-xr-x 1 root root 1842 Apr 10 2022 zmore + -rwxr-xr-x 1 root root 4577 Apr 10 2022 znew +I: user script /srv/workspace/pbuilder/10894/tmp/hooks/D02_print_environment finished -> Attempting to satisfy build-dependencies -> Creating pbuilder-satisfydepends-dummy package Package: pbuilder-satisfydepends-dummy @@ -357,7 +389,7 @@ Get: 153 http://deb.debian.org/debian bookworm/main armhf libltdl-dev armhf 2.4.7-5 [162 kB] Get: 154 http://deb.debian.org/debian bookworm/main armhf libhwloc-dev armhf 2.9.0-1 [214 kB] Get: 155 http://deb.debian.org/debian bookworm/main armhf zlib1g-dev armhf 1:1.2.13.dfsg-1 [902 kB] -Fetched 327 MB in 13s (25.4 MB/s) +Fetched 327 MB in 11s (30.4 MB/s) debconf: delaying package configuration, since apt-utils is not installed Selecting previously unselected package liblocale-gettext-perl. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 19288 files and directories currently installed.) @@ -1015,7 +1047,11 @@ Building tag database... -> Finished parsing the build-deps I: Building the package -I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-4_source.changes +I: user script /srv/workspace/pbuilder/10894/tmp/hooks/A99_set_merged_usr starting +Not re-configuring usrmerge for bookworm +I: user script /srv/workspace/pbuilder/10894/tmp/hooks/A99_set_merged_usr finished +hostname: Name or service not known +I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-4_source.changes dpkg-buildpackage: info: source package librsb dpkg-buildpackage: info: source version 1.3.0.2+dfsg-4 dpkg-buildpackage: info: source distribution unstable @@ -1035,62 +1071,62 @@ dh binary --parallel dh_update_autotools_config dh_autoreconf -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found libtoolize: putting auxiliary files in '.'. libtoolize: copying file './ltmain.sh' libtoolize: putting macros in AC_CONFIG_MACRO_DIRS, 'm4'. @@ -1132,90 +1168,90 @@ libtoolize: copying file 'm4/ltsugar.m4' libtoolize: copying file 'm4/ltversion.m4' libtoolize: copying file 'm4/lt~obsolete.m4' -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found configure.ac:66: installing './compile' configure.ac:65: installing './missing' Makefile.am: installing './depcomp' @@ -1398,7 +1434,7 @@ checking for m4... m4 checking for gmake... gmake checking for ggrep... /bin/grep -checking for bash... /bin/bash +checking for bash... /bin/sh checking for gsed... /bin/sed checking for cmp... cmp checking for basename... basename @@ -1515,7 +1551,7 @@ configure: It appears that Fortran programs can be linked without using the Fortran linker. configure: Using OPENMP_CFLAGS ok for linking an OpenMP program: adding it to LIBS. checking if your have a usable getrusage() ... 1 -checking for /bin/bash... /bin/bash +checking for /bin/sh... /bin/sh configure: Will not use Google Test. configure: You seem to not have GNU Octave or have disabled 'int' type. Part of the test suite will not be generated. If you want more testing capabilities, you should enable the 'int' type as well. checking that generated files are newer than configure... done @@ -1537,7 +1573,7 @@ config.status: executing depfiles commands config.status: executing libtool commands === configuring in librsbpp (/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=arm-linux-gnueabihf' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/arm-linux-gnueabihf' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=arm-linux-gnueabihf' 'CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=arm-linux-gnueabihf' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/arm-linux-gnueabihf' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=arm-linux-gnueabihf' 'CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether build environment is sane... yes checking for a race-free mkdir -p... /bin/mkdir -p @@ -1659,7 +1695,7 @@ configure: Will not use Google Test. checking whether you have std::thread... yes checking whether you have std::mutex... yes -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1668,7 +1704,7 @@ config.status: executing libtool commands configure: Successfully created a Makefile. === configuring in rsblib (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=arm-linux-gnueabihf' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/arm-linux-gnueabihf' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=arm-linux-gnueabihf' 'CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=arm-linux-gnueabihf' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/arm-linux-gnueabihf' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=arm-linux-gnueabihf' 'CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether build environment is sane... yes checking for a race-free mkdir -p... /bin/mkdir -p @@ -1777,7 +1813,7 @@ checking for filesystem... yes checking for main in -lstdc++fs... yes configure: Assuming you are yet to build librsb.la. (set LIBS= -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la) -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1787,7 +1823,7 @@ config.status: executing libtool commands configure: Created a Makefile. === configuring in rsbtest (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=arm-linux-gnueabihf' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/arm-linux-gnueabihf' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=arm-linux-gnueabihf' 'CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=arm-linux-gnueabihf' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/arm-linux-gnueabihf' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=arm-linux-gnueabihf' 'CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether build environment is sane... yes checking for a race-free mkdir -p... /bin/mkdir -p @@ -1898,7 +1934,7 @@ checking for filesystem... yes checking for rsb_lib_init... no checking for dd... yes -/bin/bash +/bin/sh /usr/bin/timeout checking that generated files are newer than configure... done configure: creating ./config.status @@ -1930,7 +1966,7 @@ ARFLAGS : cru M4 : m4 MAKE : gmake - BASH : /bin/bash + BASH : /bin/sh OCTAVE : false DOXYGEN : doxygen HELP2MAN : help2man @@ -1974,20 +2010,620 @@ debian/rules override_dh_auto_build make[1]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' dh_auto_build - make -j3 + make -j4 make[2]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake all-recursive gmake[3]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' Making all in librsbpp gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp.o rsbpp.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp +g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbtt.o rsbtt.cpp libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -fPIC -DPIC -o .libs/rsbpp_coo.o libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -fPIC -DPIC -o .libs/rsbpp_csr.o In file included from /usr/include/c++/12/bits/stl_algo.h:60, from /usr/include/c++/12/algorithm:61, from rsbpp.hpp:24, + from rsbtt.cpp:21: +/usr/include/c++/12/bits/stl_heap.h: In function 'void std::__adjust_heap(_RandomAccessIterator, _Distance, _Distance, _Tp, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Distance = int; _Tp = Coo::triple_ppd_t; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]': +/usr/include/c++/12/bits/stl_heap.h:224:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 224 | __adjust_heap(_RandomAccessIterator __first, _Distance __holeIndex, + | ^~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_heap.h: In function 'void std::__adjust_heap(_RandomAccessIterator, _Distance, _Distance, _Tp, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Distance = int; _Tp = Coo::triple_ppd_t; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]': +/usr/include/c++/12/bits/stl_heap.h:224:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__unguarded_linear_insert(_RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Val_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1782:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1782 | __unguarded_linear_insert(_RandomAccessIterator __last, + | ^~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__unguarded_linear_insert(_RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Val_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1782:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1802:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1802 | __insertion_sort(_RandomAccessIterator __first, + | ^~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1802:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1802:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1802:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h: In function '_RandomAccessIterator std::_V2::__rotate(_RandomAccessIterator, _RandomAccessIterator, _RandomAccessIterator, std::random_access_iterator_tag) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >]': +/usr/include/c++/12/bits/stl_algo.h:1281:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1281 | __rotate(_RandomAccessIterator __first, + | ^~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1281:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1281:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +In file included from /usr/include/c++/12/vector:64, + from rsbpp.hpp:25: +/usr/include/c++/12/bits/stl_vector.h: In function 'std::vector<_Tp, _Alloc>::vector(std::initializer_list<_Tp>, const allocator_type&) [with _Tp = double; _Alloc = std::allocator]': +/usr/include/c++/12/bits/stl_vector.h:673:7: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 673 | vector(initializer_list __l, + | ^~~~~~ +rsbtt.cpp: In function 'void test_Coo_SpMV_Symmetric()': +rsbtt.cpp:88:37: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 88 | const std::vector VA{+11}; + | ^ +rsbtt.cpp:89:35: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 89 | const std::vector X{21}; + | ^ +rsbtt.cpp:90:30: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 90 | std::vector Y{+11}; + | ^ +rsbtt.cpp: In function 'void test_Csr_SpMM_br_Unsymmetric()': +rsbtt.cpp:662:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 662 | const std::vector VA{+11,+12}; + | ^ +rsbtt.cpp:665:48: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 665 | const std::vector X{+21,+23,+22,+24}; + | ^ +rsbtt.cpp:666:42: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 666 | std::vector Y{+11,+13,-12,-14}; + | ^ +/usr/include/c++/12/bits/stl_vector.h: In function 'std::vector<_Tp, _Alloc>::vector(std::initializer_list<_Tp>, const allocator_type&) [with _Tp = std::complex; _Alloc = std::allocator >]': +/usr/include/c++/12/bits/stl_vector.h:673:7: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 673 | vector(initializer_list __l, + | ^~~~~~ +rsbtt.cpp: In function 'void test_Coo_SpMV_Complex_Symmetric_Transposed_At()': +rsbtt.cpp:176:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 176 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:177:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 177 | const std::vector X{-21,+22,-23,+24}; + | ^ +rsbtt.cpp:178:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 178 | std::vector Y{-11,+12,-13,+14}; + | ^ +rsbtt.cpp: In function 'void test_Coo_SpMV_Complex_Symmetric_Conjugated_At()': +rsbtt.cpp:204:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 204 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:205:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 205 | const std::vector X{-21,+22,-23,+24}; + | ^ +rsbtt.cpp:206:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 206 | std::vector Y{-11,+12,-13,+14}; + | ^ +rsbtt.cpp: In function 'void test_Coo_SpMV_Complex_Hermitian_At()': +rsbtt.cpp:324:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 324 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:325:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 325 | const std::vector X{-21,+22,-23,+24}; + | ^ +rsbtt.cpp:326:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 326 | std::vector Y{-11,+12,-13,+14}; + | ^ +rsbtt.cpp: In function 'void test_Coo_SpMV_Complex_Hermitian_Transposed_At()': +rsbtt.cpp:380:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 380 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:381:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 381 | const std::vector X{-21,+22,-23,+24}; + | ^ +rsbtt.cpp:382:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 382 | std::vector Y{-11,+12,-13,+14}; + | ^ +rsbtt.cpp: In function 'void test_Csr_SpMV_Complex_Symmetric_Transposed_At()': +rsbtt.cpp:234:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 234 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:235:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 235 | const std::vector X{-21,+22,-23,+24}; + | ^ +rsbtt.cpp:236:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 236 | std::vector Y{-11,+12,-13,+14}; + | ^ +rsbtt.cpp: In function 'void test_Csr_SpMV_Complex_Symmetric_Conjugated_At()': +rsbtt.cpp:264:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 264 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:265:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 265 | const std::vector X{-21,+22,-23,+24}; + | ^ +rsbtt.cpp:266:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 266 | std::vector Y{-11,+12,-13,+14}; + | ^ +rsbtt.cpp: In function 'void test_Csr_SpMV_Complex_Hermitian_At()': +rsbtt.cpp:352:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 352 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:353:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 353 | const std::vector X{-21,+22,-23,+24}; + | ^ +rsbtt.cpp:354:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 354 | std::vector Y{-11,+12,-13,+14}; + | ^ +rsbtt.cpp: In function 'void test_Csr_SpMV_Complex_Hermitian_Transposed_At()': +rsbtt.cpp:408:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 408 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:409:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 409 | const std::vector X{-21,+22,-23,+24}; + | ^ +rsbtt.cpp:410:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 410 | std::vector Y{-11,+12,-13,+14}; + | ^ +In file included from /usr/include/c++/12/vector:70: +/usr/include/c++/12/bits/vector.tcc: In member function 'void std::vector<_Tp, _Alloc>::_M_realloc_insert(iterator, _Args&& ...) [with _Args = {Coo::triple_ppd_t}; _Tp = Coo::triple_ppd_t; _Alloc = OpenMP_Allocator::triple_ppd_t>]': +/usr/include/c++/12/bits/vector.tcc:439:7: note: parameter passing for argument of type 'std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> >::iterator' changed in GCC 7.1 + 439 | vector<_Tp, _Alloc>:: + | ^~~~~~~~~~~~~~~~~~~ +In file included from /usr/include/c++/12/bits/stl_algo.h:61: +/usr/include/c++/12/bits/stl_tempbuf.h: In constructor 'std::_Temporary_buffer<_ForwardIterator, _Tp>::_Temporary_buffer(_ForwardIterator, size_type) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Tp = Coo::triple_ppd_t]': +/usr/include/c++/12/bits/stl_tempbuf.h:258:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 258 | _Temporary_buffer<_ForwardIterator, _Tp>:: + | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]': +/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1506 | __stable_partition_adaptive(_ForwardIterator __first, + | ^~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1545:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1545 | std::__stable_partition_adaptive(__first, __middle, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1546 | __len / 2, __buffer, + | ~~~~~~~~~~~~~~~~~~~~ + 1547 | __buffer_size); + | ~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1557:43: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1557 | std::__stable_partition_adaptive(__right_split, __last, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1558 | __right_len, + | ~~~~~~~~~~~~ + 1559 | __buffer, __buffer_size); + | ~~~~~~~~~~~~~~~~~~~~~~~~ +In function '_FIter std::_V2::rotate(_FIter, _FIter, _FIter) [with _FIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >]', + inlined from '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]' at /usr/include/c++/12/bits/stl_algo.h:1561:25: +/usr/include/c++/12/bits/stl_algo.h:1397:27: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1397 | return std::__rotate(__first, __middle, __last, + | ~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1398 | std::__iterator_category(__first)); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition(_ForwardIterator, _ForwardIterator, _Predicate) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1566 | __stable_partition(_ForwardIterator __first, _ForwardIterator __last, + | ^~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1580:9: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1580 | __buf(__first, std::distance(__first, __last)); + | ^~~~~ +/usr/include/c++/12/bits/stl_algo.h:1582:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1582 | std::__stable_partition_adaptive(__first, __last, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ + 1583 | _DistanceType(__buf.requested_size()), + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1584 | __buf.begin(), + | ~~~~~~~~~~~~~~ + 1585 | _DistanceType(__buf.size())); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]': +/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1506 | __stable_partition_adaptive(_ForwardIterator __first, + | ^~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1545:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1545 | std::__stable_partition_adaptive(__first, __middle, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1546 | __len / 2, __buffer, + | ~~~~~~~~~~~~~~~~~~~~ + 1547 | __buffer_size); + | ~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1557:43: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1557 | std::__stable_partition_adaptive(__right_split, __last, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1558 | __right_len, + | ~~~~~~~~~~~~ + 1559 | __buffer, __buffer_size); + | ~~~~~~~~~~~~~~~~~~~~~~~~ +In function '_FIter std::_V2::rotate(_FIter, _FIter, _FIter) [with _FIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >]', + inlined from '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]' at /usr/include/c++/12/bits/stl_algo.h:1561:25: +/usr/include/c++/12/bits/stl_algo.h:1397:27: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1397 | return std::__rotate(__first, __middle, __last, + | ~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1398 | std::__iterator_category(__first)); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition(_ForwardIterator, _ForwardIterator, _Predicate) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1566 | __stable_partition(_ForwardIterator __first, _ForwardIterator __last, + | ^~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1580:9: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1580 | __buf(__first, std::distance(__first, __last)); + | ^~~~~ +/usr/include/c++/12/bits/stl_algo.h:1582:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1582 | std::__stable_partition_adaptive(__first, __last, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ + 1583 | _DistanceType(__buf.requested_size()), + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1584 | __buf.begin(), + | ~~~~~~~~~~~~~~ + 1585 | _DistanceType(__buf.size())); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]': +/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1506 | __stable_partition_adaptive(_ForwardIterator __first, + | ^~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1545:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1545 | std::__stable_partition_adaptive(__first, __middle, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1546 | __len / 2, __buffer, + | ~~~~~~~~~~~~~~~~~~~~ + 1547 | __buffer_size); + | ~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1557:43: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1557 | std::__stable_partition_adaptive(__right_split, __last, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1558 | __right_len, + | ~~~~~~~~~~~~ + 1559 | __buffer, __buffer_size); + | ~~~~~~~~~~~~~~~~~~~~~~~~ +In function '_FIter std::_V2::rotate(_FIter, _FIter, _FIter) [with _FIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >]', + inlined from '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]' at /usr/include/c++/12/bits/stl_algo.h:1561:25: +/usr/include/c++/12/bits/stl_algo.h:1397:27: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1397 | return std::__rotate(__first, __middle, __last, + | ~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1398 | std::__iterator_category(__first)); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition(_ForwardIterator, _ForwardIterator, _Predicate) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1566 | __stable_partition(_ForwardIterator __first, _ForwardIterator __last, + | ^~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1580:9: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1580 | __buf(__first, std::distance(__first, __last)); + | ^~~~~ +/usr/include/c++/12/bits/stl_algo.h:1582:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1582 | std::__stable_partition_adaptive(__first, __last, __pred, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ + 1583 | _DistanceType(__buf.requested_size()), + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1584 | __buf.begin(), + | ~~~~~~~~~~~~~~ + 1585 | _DistanceType(__buf.size())); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__introsort_loop(_RandomAccessIterator, _RandomAccessIterator, _Size, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Size = int; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1908:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1908 | __introsort_loop(_RandomAccessIterator __first, + | ^~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1908:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1922:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1922 | std::__introsort_loop(__cut, __last, __depth_limit, __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__introsort_loop(_RandomAccessIterator, _RandomAccessIterator, _Size, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Size = int; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]': +/usr/include/c++/12/bits/stl_algo.h:1908:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1908 | __introsort_loop(_RandomAccessIterator __first, + | ^~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1908:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 +/usr/include/c++/12/bits/stl_algo.h:1922:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1922 | std::__introsort_loop(__cut, __last, __depth_limit, __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +rsbpp.hpp: In member function 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]': +rsbpp.hpp:4458:14: note: parameter passing for argument of type 'std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> >::iterator' changed in GCC 7.1 + 4458 | void zort(typename trivec_t::iterator bi, const IT lfnz, const IT lnnz, const IT lfr, const IT lnr, const IT lfc, const IT lnc, QuadTree & qt) + | ^~~~ +In function 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]', + inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_cor(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, + inlined from 'void Coo::sort_cor(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4419:12, + inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4510:14: +/usr/include/c++/12/bits/stl_algo.h:1937:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1937 | std::__introsort_loop(__first, __last, + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ + 1938 | std::__lg(__last - __first) * 2, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1939 | __comp); + | ~~~~~~~ +In function 'void std::__final_insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]', + inlined from 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]' at /usr/include/c++/12/bits/stl_algo.h:1940:31, + inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_cor(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, + inlined from 'void Coo::sort_cor(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4419:12, + inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4510:14: +/usr/include/c++/12/bits/stl_algo.h:1849:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1849 | std::__insertion_sort(__first, __first + int(_S_threshold), __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1854:30: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1854 | std::__insertion_sort(__first, __last, __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ +In function 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]', + inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_coc(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, + inlined from 'void Coo::sort_coc(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4447:12, + inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4512:14: +/usr/include/c++/12/bits/stl_algo.h:1937:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1937 | std::__introsort_loop(__first, __last, + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ + 1938 | std::__lg(__last - __first) * 2, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1939 | __comp); + | ~~~~~~~ +In function 'void std::__final_insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]', + inlined from 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]' at /usr/include/c++/12/bits/stl_algo.h:1940:31, + inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_coc(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, + inlined from 'void Coo::sort_coc(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4447:12, + inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4512:14: +/usr/include/c++/12/bits/stl_algo.h:1849:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1849 | std::__insertion_sort(__first, __first + int(_S_threshold), __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1854:30: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1854 | std::__insertion_sort(__first, __last, __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ +In function '_BIter std::stable_partition(_BIter, _BIter, _Predicate) [with _BIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = Coo::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)>]', + inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4527:40: +/usr/include/c++/12/bits/stl_algo.h:1617:37: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1617 | return std::__stable_partition(__first, __last, + | ~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ + 1618 | __gnu_cxx::__ops::__pred_iter(__pred)); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +In function '_BIter std::stable_partition(_BIter, _BIter, _Predicate) [with _BIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = Coo::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)>]', + inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4528:40: +/usr/include/c++/12/bits/stl_algo.h:1617:37: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1617 | return std::__stable_partition(__first, __last, + | ~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ + 1618 | __gnu_cxx::__ops::__pred_iter(__pred)); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +In function '_BIter std::stable_partition(_BIter, _BIter, _Predicate) [with _BIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = Coo::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)>]', + inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4529:40: +/usr/include/c++/12/bits/stl_algo.h:1617:37: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1617 | return std::__stable_partition(__first, __last, + | ~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ + 1618 | __gnu_cxx::__ops::__pred_iter(__pred)); + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +rsbpp.hpp: In member function 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]': +rsbpp.hpp:4554:37: note: parameter passing for argument of type 'std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> >::iterator' changed in GCC 7.1 + 4554 | zort(bi,qnz[midx-1],qnz.n_at(midx),qro[midx],qnr[midx],qco[midx],qnc[midx],qt); + | ~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +rsbpp.hpp: In member function 'void Coo::zort() [with IT = int; NT = double]': +rsbpp.hpp:4570:21: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 4570 | zort(coo_.begin(),0,nnz(),0,nr(),0,nc(),qt_); + | ~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +In member function 'std::vector<_Tp, _Alloc>::reference std::vector<_Tp, _Alloc>::emplace_back(_Args&& ...) [with _Args = {Coo::triple_ppd_t}; _Tp = Coo::triple_ppd_t; _Alloc = OpenMP_Allocator::triple_ppd_t>]', + inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4367:21, + inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: +/usr/include/c++/12/bits/vector.tcc:123:28: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 123 | _M_realloc_insert(end(), std::forward<_Args>(__args)...); + | ~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +In function 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]', + inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_cor(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, + inlined from 'void Coo::sort_cor(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4419:12, + inlined from 'void Coo::sort_cor() [with IT = int; NT = double]' at rsbpp.hpp:4427:11, + inlined from 'void Coo::sort() [with IT = int; NT = double]' at rsbpp.hpp:4402:13, + inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4375:14, + inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: +/usr/include/c++/12/bits/stl_algo.h:1937:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1937 | std::__introsort_loop(__first, __last, + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ + 1938 | std::__lg(__last - __first) * 2, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1939 | __comp); + | ~~~~~~~ +In function 'void std::__final_insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]', + inlined from 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]' at /usr/include/c++/12/bits/stl_algo.h:1940:31, + inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_cor(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, + inlined from 'void Coo::sort_cor(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4419:12, + inlined from 'void Coo::sort_cor() [with IT = int; NT = double]' at rsbpp.hpp:4427:11, + inlined from 'void Coo::sort() [with IT = int; NT = double]' at rsbpp.hpp:4402:13, + inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4375:14, + inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: +/usr/include/c++/12/bits/stl_algo.h:1849:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1849 | std::__insertion_sort(__first, __first + int(_S_threshold), __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1854:30: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1854 | std::__insertion_sort(__first, __last, __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ +In function 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]', + inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_coc(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, + inlined from 'void Coo::sort_coc(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4447:12, + inlined from 'void Coo::sort_coc() [with IT = int; NT = double]' at rsbpp.hpp:4455:11, + inlined from 'void Coo::sort() [with IT = int; NT = double]' at rsbpp.hpp:4405:13, + inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4375:14, + inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: +/usr/include/c++/12/bits/stl_algo.h:1937:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1937 | std::__introsort_loop(__first, __last, + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ + 1938 | std::__lg(__last - __first) * 2, + | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 1939 | __comp); + | ~~~~~~~ +In function 'void std::__final_insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]', + inlined from 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]' at /usr/include/c++/12/bits/stl_algo.h:1940:31, + inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_coc(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, + inlined from 'void Coo::sort_coc(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4447:12, + inlined from 'void Coo::sort_coc() [with IT = int; NT = double]' at rsbpp.hpp:4455:11, + inlined from 'void Coo::sort() [with IT = int; NT = double]' at rsbpp.hpp:4405:13, + inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4375:14, + inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: +/usr/include/c++/12/bits/stl_algo.h:1849:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1849 | std::__insertion_sort(__first, __first + int(_S_threshold), __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +/usr/include/c++/12/bits/stl_algo.h:1854:30: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 + 1854 | std::__insertion_sort(__first, __last, __comp); + | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ +In function 'void test_Coo_BuildsNonEmptyFromVectors()', + inlined from 'int main()' at rsbtt.cpp:840:36: +rsbtt.cpp:48:35: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 48 | std::vector VA{+11}; + | ^ +In function 'void test_Coo_SpMV_Unsymmetric()', + inlined from 'int main()' at rsbtt.cpp:843:27: +rsbtt.cpp:574:39: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 574 | const std::vector VA{11,12}; + | ^ +rsbtt.cpp:575:38: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 575 | const std::vector X{+1,-1}; + | ^ +rsbtt.cpp:576:32: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 576 | std::vector Y{+3,-3}; + | ^ +In function 'void test_Coo_SpMM_Unsymmetric()', + inlined from 'int main()' at rsbtt.cpp:844:27: +rsbtt.cpp:744:39: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 744 | const std::vector VA{11,12}; + | ^ +rsbtt.cpp:745:44: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 745 | const std::vector X{+1,-1,+2,-2}; + | ^ +rsbtt.cpp:746:32: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 746 | std::vector Y{+3,-3}; + | ^ +In function 'void test_Coo_SpMV_Unsymmetric_Transposed()', + inlined from 'int main()' at rsbtt.cpp:845:38: +rsbtt.cpp:789:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 789 | const std::vector VA{+11,+21}; + | ^ +rsbtt.cpp:790:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 790 | const std::vector X{+21,+22}; + | ^ +rsbtt.cpp:791:34: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 791 | std::vector Y{+31,-32}; + | ^ +In function 'void test_Coo_SpMV_Complex()', + inlined from 'int main()' at rsbtt.cpp:846:23: +rsbtt.cpp:503:37: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 503 | const std::vector VA{+44}; + | ^ +rsbtt.cpp:504:36: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 504 | const std::vector X{+21}; + | ^ +rsbtt.cpp:505:30: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 505 | std::vector Y{+31}; + | ^ +In function 'void test_Coo_SpMV_No_Inc()', + inlined from 'int main()' at rsbtt.cpp:847:22: +rsbtt.cpp:552:39: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 552 | const std::vector VA{11,12}; + | ^ +rsbtt.cpp:553:38: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 553 | const std::vector X{+1,-1}; + | ^ +rsbtt.cpp:554:32: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 554 | std::vector Y{+3,-3}; + | ^ +In function 'void test_Coo_SpMV_Symmetric_At()', + inlined from 'int main()' at rsbtt.cpp:848:28: +rsbtt.cpp:292:37: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 292 | const std::vector VA{+11}; + | ^ +rsbtt.cpp:293:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 293 | const std::vector X{-21,+22}; + | ^ +rsbtt.cpp:294:32: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 294 | std::vector Y{-11,3}; + | ^ +In function 'void test_Coo_SpMV_Complex_Unsymmetric_Conjugated_At()', + inlined from 'int main()' at rsbtt.cpp:853:49: +rsbtt.cpp:124:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 124 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:125:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 125 | const std::vector X{-21,-22,-23,+24}; + | ^ +rsbtt.cpp:126:34: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 126 | std::vector Y{-11,+13}; + | ^ +In function 'void test_Coo_SpMV_Symmetric_At_Short()', + inlined from 'int main()' at rsbtt.cpp:854:34: +rsbtt.cpp:437:37: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 437 | const std::vector VA{+44}; + | ^ +rsbtt.cpp:438:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 438 | const std::vector X{-11,+22}; + | ^ +rsbtt.cpp:439:34: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 439 | std::vector Y{-11,+12}; + | ^ +In function 'void test_Coo_SpMV_Complex_Hermitian()', + inlined from 'int main()' at rsbtt.cpp:855:33: +rsbtt.cpp:527:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 527 | const std::vector VA{{+4,+1}}; + | ^ +rsbtt.cpp:528:38: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 528 | const std::vector X{+1,+2}; + | ^ +rsbtt.cpp:529:32: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 529 | std::vector Y{-1,-2}; + | ^ +In function 'void test_Csr_BuildsNonEmptyFromVectors()', + inlined from 'int main()' at rsbtt.cpp:857:36: +rsbtt.cpp:64:35: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 64 | std::vector VA{+11}; + | ^ +In function 'void test_Csr_SpMV_Unsymmetric()', + inlined from 'int main()' at rsbtt.cpp:858:27: +rsbtt.cpp:601:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 601 | const std::vector VA{+11,+12}; + | ^ +rsbtt.cpp:602:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 602 | const std::vector X{+21,+22}; + | ^ +rsbtt.cpp:603:34: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 603 | std::vector Y{+11,-12}; + | ^ +In function 'void test_Csr_SpMM_Unsymmetric()', + inlined from 'int main()' at rsbtt.cpp:859:27: +rsbtt.cpp:628:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 628 | const std::vector VA{+11,+12}; + | ^ +rsbtt.cpp:629:48: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 629 | const std::vector X{+21,+22,+23,+24}; + | ^ +rsbtt.cpp:630:42: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 630 | std::vector Y{+11,-12,+13,-14}; + | ^ +In function 'void test_Csr_SpMM_Unsymmetric_Short_At()', + inlined from 'int main()' at rsbtt.cpp:861:36: +rsbtt.cpp:708:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 708 | const std::vector VA{+21,+22}; + | ^ +rsbtt.cpp:709:48: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 709 | const std::vector X{+21,+22,+23,+24}; + | ^ +rsbtt.cpp:722:46: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 722 | std::vector Y{0,-11,+12,0,-13,+14}; + | ^ +In function 'void test_Csr_SpMV_Symmetric_At_Short()', + inlined from 'int main()' at rsbtt.cpp:862:34: +rsbtt.cpp:471:37: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 471 | const std::vector VA{+44}; + | ^ +rsbtt.cpp:472:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 472 | const std::vector X{-11,+22}; + | ^ +rsbtt.cpp:473:34: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 + 473 | std::vector Y{-11,+12}; + | ^ +In function 'void test_Csr_SpMV_Complex_Unsymmetric_Conjugated_At()', + inlined from 'int main()' at rsbtt.cpp:866:49: +rsbtt.cpp:150:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 150 | const std::vector VA{{0,+44}}; + | ^ +rsbtt.cpp:151:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 151 | const std::vector X{-21,-22,-23,+24}; + | ^ +rsbtt.cpp:152:34: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 + 152 | std::vector Y{-11,+13}; + | ^ +gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -c -o rsbct.o rsbct.c +In file included from /usr/include/c++/12/bits/stl_algo.h:60, + from /usr/include/c++/12/algorithm:61, + from rsbpp.hpp:24, from rsbpp.cpp:28: /usr/include/c++/12/bits/stl_heap.h: In function 'void std::__adjust_heap(_RandomAccessIterator, _Distance, _Distance, _Tp, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator >::triple_ppd_t*, vector >::triple_ppd_t, OpenMP_Allocator >::triple_ppd_t> > >; _Distance = int; _Tp = Coo >::triple_ppd_t; _Compare = __gnu_cxx::__ops::_Iter_comp_iter >::sort_coc(int, int):: >::triple_t, Coo >::triple_t)> >]': /usr/include/c++/12/bits/stl_heap.h:224:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator >::triple_ppd_t*, std::vector >::triple_ppd_t, OpenMP_Allocator >::triple_ppd_t> > >' changed in GCC 7.1 @@ -2621,615 +3257,15 @@ /usr/include/c++/12/bits/stl_vector.h:1032:25: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator >::triple_ppd_t*, std::vector >::triple_ppd_t, OpenMP_Allocator >::triple_ppd_t> > >' changed in GCC 7.1 1032 | _M_fill_insert(end(), __new_size - size(), __x); | ~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbtt.o rsbtt.cpp -In file included from /usr/include/c++/12/bits/stl_algo.h:60, - from /usr/include/c++/12/algorithm:61, - from rsbpp.hpp:24, - from rsbtt.cpp:21: -/usr/include/c++/12/bits/stl_heap.h: In function 'void std::__adjust_heap(_RandomAccessIterator, _Distance, _Distance, _Tp, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Distance = int; _Tp = Coo::triple_ppd_t; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]': -/usr/include/c++/12/bits/stl_heap.h:224:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 224 | __adjust_heap(_RandomAccessIterator __first, _Distance __holeIndex, - | ^~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_heap.h: In function 'void std::__adjust_heap(_RandomAccessIterator, _Distance, _Distance, _Tp, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Distance = int; _Tp = Coo::triple_ppd_t; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]': -/usr/include/c++/12/bits/stl_heap.h:224:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__unguarded_linear_insert(_RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Val_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1782:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1782 | __unguarded_linear_insert(_RandomAccessIterator __last, - | ^~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__unguarded_linear_insert(_RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Val_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1782:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1802:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1802 | __insertion_sort(_RandomAccessIterator __first, - | ^~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1802:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1802:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1802:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h: In function '_RandomAccessIterator std::_V2::__rotate(_RandomAccessIterator, _RandomAccessIterator, _RandomAccessIterator, std::random_access_iterator_tag) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >]': -/usr/include/c++/12/bits/stl_algo.h:1281:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1281 | __rotate(_RandomAccessIterator __first, - | ^~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1281:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1281:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -In file included from /usr/include/c++/12/vector:64, - from rsbpp.hpp:25: -/usr/include/c++/12/bits/stl_vector.h: In function 'std::vector<_Tp, _Alloc>::vector(std::initializer_list<_Tp>, const allocator_type&) [with _Tp = double; _Alloc = std::allocator]': -/usr/include/c++/12/bits/stl_vector.h:673:7: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 673 | vector(initializer_list __l, - | ^~~~~~ -rsbtt.cpp: In function 'void test_Coo_SpMV_Symmetric()': -rsbtt.cpp:88:37: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 88 | const std::vector VA{+11}; - | ^ -rsbtt.cpp:89:35: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 89 | const std::vector X{21}; - | ^ -rsbtt.cpp:90:30: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 90 | std::vector Y{+11}; - | ^ -rsbtt.cpp: In function 'void test_Csr_SpMM_br_Unsymmetric()': -rsbtt.cpp:662:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 662 | const std::vector VA{+11,+12}; - | ^ -rsbtt.cpp:665:48: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 665 | const std::vector X{+21,+23,+22,+24}; - | ^ -rsbtt.cpp:666:42: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 666 | std::vector Y{+11,+13,-12,-14}; - | ^ -/usr/include/c++/12/bits/stl_vector.h: In function 'std::vector<_Tp, _Alloc>::vector(std::initializer_list<_Tp>, const allocator_type&) [with _Tp = std::complex; _Alloc = std::allocator >]': -/usr/include/c++/12/bits/stl_vector.h:673:7: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 673 | vector(initializer_list __l, - | ^~~~~~ -rsbtt.cpp: In function 'void test_Coo_SpMV_Complex_Symmetric_Transposed_At()': -rsbtt.cpp:176:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 176 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:177:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 177 | const std::vector X{-21,+22,-23,+24}; - | ^ -rsbtt.cpp:178:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 178 | std::vector Y{-11,+12,-13,+14}; - | ^ -rsbtt.cpp: In function 'void test_Coo_SpMV_Complex_Symmetric_Conjugated_At()': -rsbtt.cpp:204:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 204 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:205:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 205 | const std::vector X{-21,+22,-23,+24}; - | ^ -rsbtt.cpp:206:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 206 | std::vector Y{-11,+12,-13,+14}; - | ^ -rsbtt.cpp: In function 'void test_Coo_SpMV_Complex_Hermitian_At()': -rsbtt.cpp:324:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 324 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:325:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 325 | const std::vector X{-21,+22,-23,+24}; - | ^ -rsbtt.cpp:326:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 326 | std::vector Y{-11,+12,-13,+14}; - | ^ -rsbtt.cpp: In function 'void test_Coo_SpMV_Complex_Hermitian_Transposed_At()': -rsbtt.cpp:380:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 380 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:381:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 381 | const std::vector X{-21,+22,-23,+24}; - | ^ -rsbtt.cpp:382:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 382 | std::vector Y{-11,+12,-13,+14}; - | ^ -rsbtt.cpp: In function 'void test_Csr_SpMV_Complex_Symmetric_Transposed_At()': -rsbtt.cpp:234:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 234 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:235:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 235 | const std::vector X{-21,+22,-23,+24}; - | ^ -rsbtt.cpp:236:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 236 | std::vector Y{-11,+12,-13,+14}; - | ^ -rsbtt.cpp: In function 'void test_Csr_SpMV_Complex_Symmetric_Conjugated_At()': -rsbtt.cpp:264:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 264 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:265:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 265 | const std::vector X{-21,+22,-23,+24}; - | ^ -rsbtt.cpp:266:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 266 | std::vector Y{-11,+12,-13,+14}; - | ^ -rsbtt.cpp: In function 'void test_Csr_SpMV_Complex_Hermitian_At()': -rsbtt.cpp:352:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 352 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:353:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 353 | const std::vector X{-21,+22,-23,+24}; - | ^ -rsbtt.cpp:354:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 354 | std::vector Y{-11,+12,-13,+14}; - | ^ -rsbtt.cpp: In function 'void test_Csr_SpMV_Complex_Hermitian_Transposed_At()': -rsbtt.cpp:408:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 408 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:409:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 409 | const std::vector X{-21,+22,-23,+24}; - | ^ -rsbtt.cpp:410:42: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 410 | std::vector Y{-11,+12,-13,+14}; - | ^ -In file included from /usr/include/c++/12/vector:70: -/usr/include/c++/12/bits/vector.tcc: In member function 'void std::vector<_Tp, _Alloc>::_M_realloc_insert(iterator, _Args&& ...) [with _Args = {Coo::triple_ppd_t}; _Tp = Coo::triple_ppd_t; _Alloc = OpenMP_Allocator::triple_ppd_t>]': -/usr/include/c++/12/bits/vector.tcc:439:7: note: parameter passing for argument of type 'std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> >::iterator' changed in GCC 7.1 - 439 | vector<_Tp, _Alloc>:: - | ^~~~~~~~~~~~~~~~~~~ -In file included from /usr/include/c++/12/bits/stl_algo.h:61: -/usr/include/c++/12/bits/stl_tempbuf.h: In constructor 'std::_Temporary_buffer<_ForwardIterator, _Tp>::_Temporary_buffer(_ForwardIterator, size_type) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Tp = Coo::triple_ppd_t]': -/usr/include/c++/12/bits/stl_tempbuf.h:258:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 258 | _Temporary_buffer<_ForwardIterator, _Tp>:: - | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]': -/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1506 | __stable_partition_adaptive(_ForwardIterator __first, - | ^~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1545:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1545 | std::__stable_partition_adaptive(__first, __middle, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1546 | __len / 2, __buffer, - | ~~~~~~~~~~~~~~~~~~~~ - 1547 | __buffer_size); - | ~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1557:43: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1557 | std::__stable_partition_adaptive(__right_split, __last, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1558 | __right_len, - | ~~~~~~~~~~~~ - 1559 | __buffer, __buffer_size); - | ~~~~~~~~~~~~~~~~~~~~~~~~ -In function '_FIter std::_V2::rotate(_FIter, _FIter, _FIter) [with _FIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >]', - inlined from '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]' at /usr/include/c++/12/bits/stl_algo.h:1561:25: -/usr/include/c++/12/bits/stl_algo.h:1397:27: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1397 | return std::__rotate(__first, __middle, __last, - | ~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1398 | std::__iterator_category(__first)); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition(_ForwardIterator, _ForwardIterator, _Predicate) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1566 | __stable_partition(_ForwardIterator __first, _ForwardIterator __last, - | ^~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1580:9: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1580 | __buf(__first, std::distance(__first, __last)); - | ^~~~~ -/usr/include/c++/12/bits/stl_algo.h:1582:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1582 | std::__stable_partition_adaptive(__first, __last, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ - 1583 | _DistanceType(__buf.requested_size()), - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1584 | __buf.begin(), - | ~~~~~~~~~~~~~~ - 1585 | _DistanceType(__buf.size())); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]': -/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1506 | __stable_partition_adaptive(_ForwardIterator __first, - | ^~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1545:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1545 | std::__stable_partition_adaptive(__first, __middle, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1546 | __len / 2, __buffer, - | ~~~~~~~~~~~~~~~~~~~~ - 1547 | __buffer_size); - | ~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1557:43: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1557 | std::__stable_partition_adaptive(__right_split, __last, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1558 | __right_len, - | ~~~~~~~~~~~~ - 1559 | __buffer, __buffer_size); - | ~~~~~~~~~~~~~~~~~~~~~~~~ -In function '_FIter std::_V2::rotate(_FIter, _FIter, _FIter) [with _FIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >]', - inlined from '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]' at /usr/include/c++/12/bits/stl_algo.h:1561:25: -/usr/include/c++/12/bits/stl_algo.h:1397:27: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1397 | return std::__rotate(__first, __middle, __last, - | ~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1398 | std::__iterator_category(__first)); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition(_ForwardIterator, _ForwardIterator, _Predicate) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1566 | __stable_partition(_ForwardIterator __first, _ForwardIterator __last, - | ^~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1580:9: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1580 | __buf(__first, std::distance(__first, __last)); - | ^~~~~ -/usr/include/c++/12/bits/stl_algo.h:1582:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1582 | std::__stable_partition_adaptive(__first, __last, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ - 1583 | _DistanceType(__buf.requested_size()), - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1584 | __buf.begin(), - | ~~~~~~~~~~~~~~ - 1585 | _DistanceType(__buf.size())); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]': -/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1506 | __stable_partition_adaptive(_ForwardIterator __first, - | ^~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1506:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1545:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1545 | std::__stable_partition_adaptive(__first, __middle, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1546 | __len / 2, __buffer, - | ~~~~~~~~~~~~~~~~~~~~ - 1547 | __buffer_size); - | ~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1557:43: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1557 | std::__stable_partition_adaptive(__right_split, __last, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1558 | __right_len, - | ~~~~~~~~~~~~ - 1559 | __buffer, __buffer_size); - | ~~~~~~~~~~~~~~~~~~~~~~~~ -In function '_FIter std::_V2::rotate(_FIter, _FIter, _FIter) [with _FIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >]', - inlined from '_ForwardIterator std::__stable_partition_adaptive(_ForwardIterator, _ForwardIterator, _Predicate, _Distance, _Pointer, _Distance) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Pointer = Coo::triple_ppd_t*; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >; _Distance = int]' at /usr/include/c++/12/bits/stl_algo.h:1561:25: -/usr/include/c++/12/bits/stl_algo.h:1397:27: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1397 | return std::__rotate(__first, __middle, __last, - | ~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1398 | std::__iterator_category(__first)); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function '_ForwardIterator std::__stable_partition(_ForwardIterator, _ForwardIterator, _Predicate) [with _ForwardIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = __gnu_cxx::__ops::_Iter_pred::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1566 | __stable_partition(_ForwardIterator __first, _ForwardIterator __last, - | ^~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1566:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1580:9: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1580 | __buf(__first, std::distance(__first, __last)); - | ^~~~~ -/usr/include/c++/12/bits/stl_algo.h:1582:41: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1582 | std::__stable_partition_adaptive(__first, __last, __pred, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ - 1583 | _DistanceType(__buf.requested_size()), - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1584 | __buf.begin(), - | ~~~~~~~~~~~~~~ - 1585 | _DistanceType(__buf.size())); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__introsort_loop(_RandomAccessIterator, _RandomAccessIterator, _Size, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Size = int; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1908:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1908 | __introsort_loop(_RandomAccessIterator __first, - | ^~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1908:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1922:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1922 | std::__introsort_loop(__cut, __last, __depth_limit, __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h: In function 'void std::__introsort_loop(_RandomAccessIterator, _RandomAccessIterator, _Size, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Size = int; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]': -/usr/include/c++/12/bits/stl_algo.h:1908:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1908 | __introsort_loop(_RandomAccessIterator __first, - | ^~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1908:5: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 -/usr/include/c++/12/bits/stl_algo.h:1922:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1922 | std::__introsort_loop(__cut, __last, __depth_limit, __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -rsbpp.hpp: In member function 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]': -rsbpp.hpp:4458:14: note: parameter passing for argument of type 'std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> >::iterator' changed in GCC 7.1 - 4458 | void zort(typename trivec_t::iterator bi, const IT lfnz, const IT lnnz, const IT lfr, const IT lnr, const IT lfc, const IT lnc, QuadTree & qt) - | ^~~~ -In function 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]', - inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_cor(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, - inlined from 'void Coo::sort_cor(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4419:12, - inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4510:14: -/usr/include/c++/12/bits/stl_algo.h:1937:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1937 | std::__introsort_loop(__first, __last, - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ - 1938 | std::__lg(__last - __first) * 2, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1939 | __comp); - | ~~~~~~~ -In function 'void std::__final_insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]', - inlined from 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]' at /usr/include/c++/12/bits/stl_algo.h:1940:31, - inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_cor(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, - inlined from 'void Coo::sort_cor(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4419:12, - inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4510:14: -/usr/include/c++/12/bits/stl_algo.h:1849:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1849 | std::__insertion_sort(__first, __first + int(_S_threshold), __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1854:30: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1854 | std::__insertion_sort(__first, __last, __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ -In function 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]', - inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_coc(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, - inlined from 'void Coo::sort_coc(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4447:12, - inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4512:14: -/usr/include/c++/12/bits/stl_algo.h:1937:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1937 | std::__introsort_loop(__first, __last, - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ - 1938 | std::__lg(__last - __first) * 2, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1939 | __comp); - | ~~~~~~~ -In function 'void std::__final_insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]', - inlined from 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]' at /usr/include/c++/12/bits/stl_algo.h:1940:31, - inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_coc(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, - inlined from 'void Coo::sort_coc(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4447:12, - inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4512:14: -/usr/include/c++/12/bits/stl_algo.h:1849:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1849 | std::__insertion_sort(__first, __first + int(_S_threshold), __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1854:30: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1854 | std::__insertion_sort(__first, __last, __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ -In function '_BIter std::stable_partition(_BIter, _BIter, _Predicate) [with _BIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = Coo::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)>]', - inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4527:40: -/usr/include/c++/12/bits/stl_algo.h:1617:37: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1617 | return std::__stable_partition(__first, __last, - | ~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ - 1618 | __gnu_cxx::__ops::__pred_iter(__pred)); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -In function '_BIter std::stable_partition(_BIter, _BIter, _Predicate) [with _BIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = Coo::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)>]', - inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4528:40: -/usr/include/c++/12/bits/stl_algo.h:1617:37: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1617 | return std::__stable_partition(__first, __last, - | ~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ - 1618 | __gnu_cxx::__ops::__pred_iter(__pred)); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -In function '_BIter std::stable_partition(_BIter, _BIter, _Predicate) [with _BIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Predicate = Coo::zort(std::vector >::iterator, int, int, int, int, int, int, QuadTree&)::::triple_t)>]', - inlined from 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]' at rsbpp.hpp:4529:40: -/usr/include/c++/12/bits/stl_algo.h:1617:37: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1617 | return std::__stable_partition(__first, __last, - | ~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ - 1618 | __gnu_cxx::__ops::__pred_iter(__pred)); - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -rsbpp.hpp: In member function 'void Coo::zort(typename trivec_t::iterator, IT, IT, IT, IT, IT, IT, QuadTree&) [with IT = int; NT = double]': -rsbpp.hpp:4554:37: note: parameter passing for argument of type 'std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> >::iterator' changed in GCC 7.1 - 4554 | zort(bi,qnz[midx-1],qnz.n_at(midx),qro[midx],qnr[midx],qco[midx],qnc[midx],qt); - | ~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -rsbpp.hpp: In member function 'void Coo::zort() [with IT = int; NT = double]': -rsbpp.hpp:4570:21: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 4570 | zort(coo_.begin(),0,nnz(),0,nr(),0,nc(),qt_); - | ~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -In member function 'std::vector<_Tp, _Alloc>::reference std::vector<_Tp, _Alloc>::emplace_back(_Args&& ...) [with _Args = {Coo::triple_ppd_t}; _Tp = Coo::triple_ppd_t; _Alloc = OpenMP_Allocator::triple_ppd_t>]', - inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4367:21, - inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: -/usr/include/c++/12/bits/vector.tcc:123:28: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 123 | _M_realloc_insert(end(), std::forward<_Args>(__args)...); - | ~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -In function 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]', - inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_cor(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, - inlined from 'void Coo::sort_cor(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4419:12, - inlined from 'void Coo::sort_cor() [with IT = int; NT = double]' at rsbpp.hpp:4427:11, - inlined from 'void Coo::sort() [with IT = int; NT = double]' at rsbpp.hpp:4402:13, - inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4375:14, - inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: -/usr/include/c++/12/bits/stl_algo.h:1937:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1937 | std::__introsort_loop(__first, __last, - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ - 1938 | std::__lg(__last - __first) * 2, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1939 | __comp); - | ~~~~~~~ -In function 'void std::__final_insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]', - inlined from 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_cor(int, int)::::triple_t, Coo::triple_t)> >]' at /usr/include/c++/12/bits/stl_algo.h:1940:31, - inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_cor(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, - inlined from 'void Coo::sort_cor(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4419:12, - inlined from 'void Coo::sort_cor() [with IT = int; NT = double]' at rsbpp.hpp:4427:11, - inlined from 'void Coo::sort() [with IT = int; NT = double]' at rsbpp.hpp:4402:13, - inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4375:14, - inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: -/usr/include/c++/12/bits/stl_algo.h:1849:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1849 | std::__insertion_sort(__first, __first + int(_S_threshold), __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1854:30: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1854 | std::__insertion_sort(__first, __last, __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ -In function 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]', - inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_coc(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, - inlined from 'void Coo::sort_coc(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4447:12, - inlined from 'void Coo::sort_coc() [with IT = int; NT = double]' at rsbpp.hpp:4455:11, - inlined from 'void Coo::sort() [with IT = int; NT = double]' at rsbpp.hpp:4405:13, - inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4375:14, - inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: -/usr/include/c++/12/bits/stl_algo.h:1937:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1937 | std::__introsort_loop(__first, __last, - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~ - 1938 | std::__lg(__last - __first) * 2, - | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 1939 | __comp); - | ~~~~~~~ -In function 'void std::__final_insertion_sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]', - inlined from 'void std::__sort(_RandomAccessIterator, _RandomAccessIterator, _Compare) [with _RandomAccessIterator = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = __gnu_cxx::__ops::_Iter_comp_iter::sort_coc(int, int)::::triple_t, Coo::triple_t)> >]' at /usr/include/c++/12/bits/stl_algo.h:1940:31, - inlined from 'void std::sort(_RAIter, _RAIter, _Compare) [with _RAIter = __gnu_cxx::__normal_iterator::triple_ppd_t*, vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >; _Compare = Coo::sort_coc(int, int)::::triple_t, Coo::triple_t)>]' at /usr/include/c++/12/bits/stl_algo.h:4853:18, - inlined from 'void Coo::sort_coc(IT, IT) [with IT = int; NT = double]' at rsbpp.hpp:4447:12, - inlined from 'void Coo::sort_coc() [with IT = int; NT = double]' at rsbpp.hpp:4455:11, - inlined from 'void Coo::sort() [with IT = int; NT = double]' at rsbpp.hpp:4405:13, - inlined from 'void Coo::init_coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4375:14, - inlined from 'Coo::Coo(const std::vector&, const std::vector&, const std::vector&, rsb_flags_t, Ordering) [with IT = int; NT = double]' at rsbpp.hpp:4303:11: -/usr/include/c++/12/bits/stl_algo.h:1849:32: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1849 | std::__insertion_sort(__first, __first + int(_S_threshold), __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/usr/include/c++/12/bits/stl_algo.h:1854:30: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator::triple_ppd_t*, std::vector::triple_ppd_t, OpenMP_Allocator::triple_ppd_t> > >' changed in GCC 7.1 - 1854 | std::__insertion_sort(__first, __last, __comp); - | ~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~ -In function 'void test_Coo_BuildsNonEmptyFromVectors()', - inlined from 'int main()' at rsbtt.cpp:840:36: -rsbtt.cpp:48:35: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 48 | std::vector VA{+11}; - | ^ -In function 'void test_Coo_SpMV_Unsymmetric()', - inlined from 'int main()' at rsbtt.cpp:843:27: -rsbtt.cpp:574:39: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 574 | const std::vector VA{11,12}; - | ^ -rsbtt.cpp:575:38: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 575 | const std::vector X{+1,-1}; - | ^ -rsbtt.cpp:576:32: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 576 | std::vector Y{+3,-3}; - | ^ -In function 'void test_Coo_SpMM_Unsymmetric()', - inlined from 'int main()' at rsbtt.cpp:844:27: -rsbtt.cpp:744:39: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 744 | const std::vector VA{11,12}; - | ^ -rsbtt.cpp:745:44: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 745 | const std::vector X{+1,-1,+2,-2}; - | ^ -rsbtt.cpp:746:32: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 746 | std::vector Y{+3,-3}; - | ^ -In function 'void test_Coo_SpMV_Unsymmetric_Transposed()', - inlined from 'int main()' at rsbtt.cpp:845:38: -rsbtt.cpp:789:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 789 | const std::vector VA{+11,+21}; - | ^ -rsbtt.cpp:790:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 790 | const std::vector X{+21,+22}; - | ^ -rsbtt.cpp:791:34: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 791 | std::vector Y{+31,-32}; - | ^ -In function 'void test_Coo_SpMV_Complex()', - inlined from 'int main()' at rsbtt.cpp:846:23: -rsbtt.cpp:503:37: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 503 | const std::vector VA{+44}; - | ^ -rsbtt.cpp:504:36: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 504 | const std::vector X{+21}; - | ^ -rsbtt.cpp:505:30: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 505 | std::vector Y{+31}; - | ^ -In function 'void test_Coo_SpMV_No_Inc()', - inlined from 'int main()' at rsbtt.cpp:847:22: -rsbtt.cpp:552:39: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 552 | const std::vector VA{11,12}; - | ^ -rsbtt.cpp:553:38: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 553 | const std::vector X{+1,-1}; - | ^ -rsbtt.cpp:554:32: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 554 | std::vector Y{+3,-3}; - | ^ -In function 'void test_Coo_SpMV_Symmetric_At()', - inlined from 'int main()' at rsbtt.cpp:848:28: -rsbtt.cpp:292:37: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 292 | const std::vector VA{+11}; - | ^ -rsbtt.cpp:293:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 293 | const std::vector X{-21,+22}; - | ^ -rsbtt.cpp:294:32: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 294 | std::vector Y{-11,3}; - | ^ -In function 'void test_Coo_SpMV_Complex_Unsymmetric_Conjugated_At()', - inlined from 'int main()' at rsbtt.cpp:853:49: -rsbtt.cpp:124:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 124 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:125:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 125 | const std::vector X{-21,-22,-23,+24}; - | ^ -rsbtt.cpp:126:34: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 126 | std::vector Y{-11,+13}; - | ^ -In function 'void test_Coo_SpMV_Symmetric_At_Short()', - inlined from 'int main()' at rsbtt.cpp:854:34: -rsbtt.cpp:437:37: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 437 | const std::vector VA{+44}; - | ^ -rsbtt.cpp:438:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 438 | const std::vector X{-11,+22}; - | ^ -rsbtt.cpp:439:34: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 439 | std::vector Y{-11,+12}; - | ^ -In function 'void test_Coo_SpMV_Complex_Hermitian()', - inlined from 'int main()' at rsbtt.cpp:855:33: -rsbtt.cpp:527:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 527 | const std::vector VA{{+4,+1}}; - | ^ -rsbtt.cpp:528:38: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 528 | const std::vector X{+1,+2}; - | ^ -rsbtt.cpp:529:32: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 529 | std::vector Y{-1,-2}; - | ^ -In function 'void test_Csr_BuildsNonEmptyFromVectors()', - inlined from 'int main()' at rsbtt.cpp:857:36: -rsbtt.cpp:64:35: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 64 | std::vector VA{+11}; - | ^ -In function 'void test_Csr_SpMV_Unsymmetric()', - inlined from 'int main()' at rsbtt.cpp:858:27: -rsbtt.cpp:601:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 601 | const std::vector VA{+11,+12}; - | ^ -rsbtt.cpp:602:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 602 | const std::vector X{+21,+22}; - | ^ -rsbtt.cpp:603:34: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 603 | std::vector Y{+11,-12}; - | ^ -In function 'void test_Csr_SpMM_Unsymmetric()', - inlined from 'int main()' at rsbtt.cpp:859:27: -rsbtt.cpp:628:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 628 | const std::vector VA{+11,+12}; - | ^ -rsbtt.cpp:629:48: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 629 | const std::vector X{+21,+22,+23,+24}; - | ^ -rsbtt.cpp:630:42: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 630 | std::vector Y{+11,-12,+13,-14}; - | ^ -In function 'void test_Csr_SpMM_Unsymmetric_Short_At()', - inlined from 'int main()' at rsbtt.cpp:861:36: -rsbtt.cpp:708:41: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 708 | const std::vector VA{+21,+22}; - | ^ -rsbtt.cpp:709:48: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 709 | const std::vector X{+21,+22,+23,+24}; - | ^ -rsbtt.cpp:722:46: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 722 | std::vector Y{0,-11,+12,0,-13,+14}; - | ^ -In function 'void test_Csr_SpMV_Symmetric_At_Short()', - inlined from 'int main()' at rsbtt.cpp:862:34: -rsbtt.cpp:471:37: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 471 | const std::vector VA{+44}; - | ^ -rsbtt.cpp:472:40: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 472 | const std::vector X{-11,+22}; - | ^ -rsbtt.cpp:473:34: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 - 473 | std::vector Y{-11,+12}; - | ^ -In function 'void test_Csr_SpMV_Complex_Unsymmetric_Conjugated_At()', - inlined from 'int main()' at rsbtt.cpp:866:49: -rsbtt.cpp:150:41: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 150 | const std::vector VA{{0,+44}}; - | ^ -rsbtt.cpp:151:48: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 151 | const std::vector X{-21,-22,-23,+24}; - | ^ -rsbtt.cpp:152:34: note: parameter passing for argument of type 'std::initializer_list >' changed in GCC 7.1 - 152 | std::vector Y{-11,+13}; - | ^ -gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -c -o rsbct.o rsbct.c libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -o rsbpp_coo.o >/dev/null 2>&1 libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -o rsbpp_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs libtool: link: ar cr .libs/librsbpp.a .libs/rsbpp_coo.o .libs/rsbpp_csr.o libtool: link: ranlib .libs/librsbpp.a libtool: link: ( cd ".libs" && rm -f "librsbpp.la" && ln -s "../librsbpp.la" "librsbpp.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbpp rsbpp.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbtt rsbtt.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbct rsbct.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp @@ -3250,8 +3286,28 @@ gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsbench-rsb_libspblas_tests.o `test -f 'rsb_libspblas_tests.c' || echo './'`rsb_libspblas_tests.c g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -c -o rsb_dummy.o rsb_dummy.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o ch2icfb-ch2icfb.o `test -f 'ch2icfb.c' || echo './'`ch2icfb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_stropts.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_stropts.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_stropts.c -o librsb_nounroll_la-rsb_stropts.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_unroll.c -o librsb_nounroll_la-rsb_unroll.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_vb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_vb.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_strmif.c -o librsb_nounroll_la-rsb_strmif.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_vb.c -o librsb_nounroll_la-rsb_krnl_vb.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_lb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_lb.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_lb.c -o librsb_nounroll_la-rsb_krnl_lb.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mergesort.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_mergesort.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mergesort.c -o librsb_nounroll_la-rsb_mergesort.o >/dev/null 2>&1 rsb_test_matops.c: In function 'rsb__main_block_partitioned_spmv_sxsa': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -3270,38 +3326,21 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_stropts.c -o librsb_nounroll_la-rsb_stropts.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_unroll.c -o librsb_nounroll_la-rsb_unroll.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_vb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_vb.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_strmif.c -o librsb_nounroll_la-rsb_strmif.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_vb.c -o librsb_nounroll_la-rsb_krnl_vb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_lb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_lb.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_lb.c -o librsb_nounroll_la-rsb_krnl_lb.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bench.c -o librsb_nounroll_la-rsb_bench.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mergesort.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_mergesort.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mergesort.c -o librsb_nounroll_la-rsb_mergesort.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_permute.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_permute.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bench.c -o librsb_nounroll_la-rsb_bench.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_permute.c -o librsb_nounroll_la-rsb_permute.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_l.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_l.c -o librsb_nounroll_la-rsb_krnl_bcss_l.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_u.c -o librsb_nounroll_la-rsb_krnl_bcss_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 rsb_test_matops.c: In function 'rsb__main_block_partitioned_spsv_sxsx': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -3316,7 +3355,8 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl.c -o librsb_nounroll_la-rsb_krnl.o >/dev/null 2>&1 rsb_test_matops.c: In function 'rsb__main_block_partitioned_mat_stats': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] @@ -3332,220 +3372,217 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss.c -o librsb_nounroll_la-rsb_krnl_bcss.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spmv.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spmv.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spmv.c -o librsb_nounroll_la-rsb_spmv.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_merge.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_merge.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_merge.c -o librsb_nounroll_la-rsb_merge.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_ompio.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_ompio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_ompio.c -o librsb_nounroll_la-rsb_ompio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_util.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_util.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm_csr.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spgemm_csr.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm_csr.c -o librsb_nounroll_la-rsb_spgemm_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum_misc.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spsum_misc.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum_misc.c -o librsb_nounroll_la-rsb_spsum_misc.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_prec.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_prec.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_prec.c -o librsb_nounroll_la-rsb_prec.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_is.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_is.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_is.c -o librsb_base_la-rsb_is.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mio.c -o librsb_base_la-rsb_mio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_op.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_op.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_op.c -o librsb_base_la-rsb_op.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_bio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bio.c -o librsb_base_la-rsb_bio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_get.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_get.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_get.c -o librsb_base_la-rsb_get.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_set.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_set.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_set.c -o librsb_base_la-rsb_set.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo.c -o librsb_base_la-rsb_coo.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_check.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_check.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_check.c -o librsb_base_la-rsb_coo_check.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_symm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_symm.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_symm.c -o librsb_base_la-rsb_coo_symm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_idx.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_idx.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_idx.c -o librsb_base_la-rsb_idx.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srt.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srt.c -o librsb_base_la-rsb_srt.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srtp.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srtp.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srtp.c -o librsb_base_la-rsb_srtp.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_src.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_src.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_src.c -o librsb_base_la-rsb_src.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_test_accuracy.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_test_accuracy.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_test_accuracy.c -o librsb_base_la-rsb_test_accuracy.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_clone.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_clone.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_clone.c -o librsb_base_la-rsb_clone.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec.c -o librsb_base_la-rsb_rec.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_render.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_render.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_render.c -o librsb_base_la-rsb_render.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec.c -o librsb_base_la-rsb_rec.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_eps.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_eps.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_eps.c -o librsb_base_la-rsb_eps.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_msort_up.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_msort_up.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_eps.c -o librsb_base_la-rsb_eps.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_msort_up.c -o librsb_base_la-rsb_msort_up.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_sys.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_sys.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_sys.c -o librsb_base_la-rsb_sys.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_blas_stuff.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_blas_stuff.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_sys.c -o librsb_base_la-rsb_sys.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_blas_stuff.c -o librsb_base_la-rsb_blas_stuff.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_gen.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_gen.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_gen.c -o librsb_base_la-rsb_gen.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_perf.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_perf.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_gen.c -o librsb_base_la-rsb_gen.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_perf.c -o librsb_base_la-rsb_perf.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rsb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rsb.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rsb.c -o librsb_base_la-rsb_rsb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_err.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_err.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_err.c -o librsb_base_la-rsb_err.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rsb.c -o librsb_base_la-rsb_rsb.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_tune.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_tune.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_do.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_do.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_do.c -o librsb_base_la-rsb_do.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_internals.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_internals.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_internals.c -o librsb_base_la-rsb_internals.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_garbage.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_garbage.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_internals.c -o librsb_base_la-rsb_internals.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_garbage.c -o librsb_base_la-rsb_garbage.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mmio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mmio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mmio.c -o librsb_base_la-rsb_mmio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_partition.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_partition.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_partition.c -o librsb_base_la-rsb_partition.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mbw.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mbw.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_limiter.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_limiter.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_limiter.c -o librsb_base_la-rsb_limiter.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_fpb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_fpb.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_fpb.c -o librsb_base_la-rsb_fpb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spgemm.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm.c -o librsb_base_la-rsb_spgemm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsum.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm.c -o librsb_base_la-rsb_spgemm.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum.c -o librsb_base_la-rsb_spsum.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsv.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsv.c -o librsb_base_la-rsb_spsv.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_lock.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_lock.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_lock.c -o librsb_base_la-rsb_lock.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsv.c -o librsb_base_la-rsb_spsv.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_swt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_swt.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_swt.c -o librsb_base_la-rsb_swt.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_init.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_init.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_swt.c -o librsb_base_la-rsb_swt.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_init.c -o librsb_base_la-rsb_init.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_dump.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_dump.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_cpmv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_cpmv.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_cpmv.c -o librsb_base_la-rsb_cpmv.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_asm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_asm.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_user.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_user.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_user.c -o librsb_base_la-rsb_user.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo2rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo2rec.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2coo.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2coo.c -o librsb_base_la-rsb_rec2coo.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2csr.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2csr.c -o librsb_base_la-rsb_rec2csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr2coo.c -o librsb_base_la-rsb_csr2coo.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c rsb_blas_sparse.F90 -fPIC -o .libs/rsb_blas_sparse.o -libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c rsb_blas_sparse.F90 -o rsb_blas_sparse.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas_handle.c -fPIC -DPIC -o .libs/rsb_libspblas_handle.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas_handle.c -o rsb_libspblas_handle.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c +libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c rsb_blas_sparse.F90 -o rsb_blas_sparse.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas.c -fPIC -DPIC -o .libs/rsb_libspblas.o +gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c -o rsb_blas_sparse.o rsb_blas_sparse.F90 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas.c -o rsb_libspblas.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: warning: '-version-info' is ignored for programs libtool: link: gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -Wl,-z -Wl,relro -o ch2icfb ch2icfb-ch2icfb.o -fopenmp -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: warning: '-version-info/-version-number' is ignored for convenience libraries +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: ar cr .libs/librsb_base.a .libs/librsb_base_la-rsb_is.o .libs/librsb_base_la-rsb_mio.o .libs/librsb_base_la-rsb_op.o .libs/librsb_base_la-rsb_bio.o .libs/librsb_base_la-rsb_get.o .libs/librsb_base_la-rsb_set.o .libs/librsb_base_la-rsb_coo.o .libs/librsb_base_la-rsb_csr.o .libs/librsb_base_la-rsb_coo_check.o .libs/librsb_base_la-rsb_coo_symm.o .libs/librsb_base_la-rsb_idx.o .libs/librsb_base_la-rsb_srt.o .libs/librsb_base_la-rsb_srtp.o .libs/librsb_base_la-rsb_src.o .libs/librsb_base_la-rsb_test_accuracy.o .libs/librsb_base_la-rsb_clone.o .libs/librsb_base_la-rsb_rec.o .libs/librsb_base_la-rsb_render.o .libs/librsb_base_la-rsb_eps.o .libs/librsb_base_la-rsb_msort_up.o .libs/librsb_base_la-rsb_sys.o .libs/librsb_base_la-rsb_blas_stuff.o .libs/librsb_base_la-rsb_gen.o .libs/librsb_base_la-rsb_perf.o .libs/librsb_base_la-rsb_rsb.o .libs/librsb_base_la-rsb_err.o .libs/librsb_base_la-rsb_tune.o .libs/librsb_base_la-rsb_do.o .libs/librsb_base_la-rsb_internals.o .libs/librsb_base_la-rsb_garbage.o .libs/librsb_base_la-rsb_mmio.o .libs/librsb_base_la-rsb_partition.o .libs/librsb_base_la-rsb_mbw.o .libs/librsb_base_la-rsb_limiter.o .libs/librsb_base_la-rsb_fpb.o .libs/librsb_base_la-rsb_spgemm.o .libs/librsb_base_la-rsb_spsum.o .libs/librsb_base_la-rsb_spsv.o .libs/librsb_base_la-rsb_lock.o .libs/librsb_base_la-rsb_swt.o .libs/librsb_base_la-rsb_init.o .libs/librsb_base_la-rsb_dump.o .libs/librsb_base_la-rsb_cpmv.o .libs/librsb_base_la-rsb_asm.o .libs/librsb_base_la-rsb_user.o .libs/librsb_base_la-rsb_coo2rec.o .libs/librsb_base_la-rsb_rec2coo.o .libs/librsb_base_la-rsb_rec2csr.o .libs/librsb_base_la-rsb_csr2coo.o .libs/rsb_blas_sparse.o libtool: link: ranlib .libs/librsb_base.a libtool: link: ( cd ".libs" && rm -f "librsb_base.la" && ln -s "../librsb_base.la" "librsb_base.la" ) -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +if test -f ./rsb_types.h -a ! -f ./rsb_types.h ; then cp -pv ./rsb_types.h ./rsb_types.h ; fi # out-of-dir behaviour varies between installations +if test -f ch2icfb ; then if SED=/bin/sed GREP=/bin/grep /bin/sh ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c -o rsb.lo rsb.F90 libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_spblas.a .libs/rsb_libspblas_handle.o .libs/rsb_libspblas.o libtool: link: ranlib .libs/librsb_spblas.a -libtool: link: ( cd ".libs" && rm -f "librsb_spblas.la" && ln -s "../librsb_spblas.la" "librsb_spblas.la" ) -if test -f ./rsb_types.h -a ! -f ./rsb_types.h ; then cp -pv ./rsb_types.h ./rsb_types.h ; fi # out-of-dir behaviour varies between installations -if test -f ch2icfb ; then if SED=/bin/sed GREP=/bin/grep /bin/bash ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c -o rsb.lo rsb.F90 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c rsb.F90 -fPIC -o .libs/rsb.o -libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c rsb.F90 -o rsb.o >/dev/null 2>&1 +libtool: link: ( cd ".libs" && rm -f "librsb_spblas.la" && ln -s "../librsb_spblas.la" "librsb_spblas.la" ) gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c -o rsb.o rsb.F90 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c rsb.F90 -o rsb.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_nounroll.a .libs/librsb_nounroll_la-rsb_stropts.o .libs/librsb_nounroll_la-rsb_strmif.o .libs/librsb_nounroll_la-rsb_unroll.o .libs/librsb_nounroll_la-rsb_krnl_vb.o .libs/librsb_nounroll_la-rsb_krnl_lb.o .libs/librsb_nounroll_la-rsb_krnl.o .libs/librsb_nounroll_la-rsb_bench.o .libs/librsb_nounroll_la-rsb_mergesort.o .libs/librsb_nounroll_la-rsb_permute.o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss.o .libs/librsb_nounroll_la-rsb_spmv.o .libs/librsb_nounroll_la-rsb_merge.o .libs/librsb_nounroll_la-rsb_ompio.o .libs/librsb_nounroll_la-rsb_util.o .libs/librsb_nounroll_la-rsb_spgemm_csr.o .libs/librsb_nounroll_la-rsb_spsum_misc.o .libs/librsb_nounroll_la-rsb_prec.o libtool: link: ranlib .libs/librsb_nounroll.a libtool: link: ( cd ".libs" && rm -f "librsb_nounroll.la" && ln -s "../librsb_nounroll.la" "librsb_nounroll.la" ) -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/arm-linux-gnueabihf rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/arm-linux-gnueabihf rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: gcc -shared -fPIC -DPIC .libs/rsb.o -Wl,--whole-archive ./.libs/librsb_nounroll.a ./.libs/librsb_base.a ./.libs/librsb_spblas.a /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/.libs/librsbpp.a -Wl,--no-whole-archive -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lpthread -lstdc++fs -lstdc++ -lhwloc -lz -lgfortran -lm -g -O2 -fstack-protector-strong -O3 -Wl,-z -Wl,relro -fopenmp -fopenmp -Wl,-soname -Wl,librsb.so.0 -o .libs/librsb.so.0.0.0 libtool: link: (cd ".libs" && rm -f "librsb.so.0" && ln -s "librsb.so.0.0.0" "librsb.so.0") libtool: link: (cd ".libs" && rm -f "librsb.so" && ln -s "librsb.so.0.0.0" "librsb.so") @@ -3557,7 +3594,7 @@ libtool: link: ranlib .libs/librsb.a libtool: link: rm -fr .libs/librsb.lax libtool: link: ( cd ".libs" && rm -f "librsb.la" && ln -s "../librsb.la" "librsb.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: warning: '-version-info' is ignored for programs libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o -fopenmp ./.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -3574,27 +3611,27 @@ gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c -o fortran.o fortran.F90 gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fopenmp -c -o fortran_rsb_fi.o fortran_rsb_fi.F90 g++ -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -c -o cplusplus.o cplusplus.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/hello hello.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/snippets snippets.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/power power.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/autotune autotune.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/backsolve backsolve.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/hello-spblas hello-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/io-spblas io-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/fortran fortran.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/fortran_rsb_fi fortran_rsb_fi.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/snippets snippets.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/cplusplus cplusplus.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/arm-linux-gnueabihf/12 -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../../arm-linux-gnueabihf -L/usr/lib/gcc/arm-linux-gnueabihf/12/../../.. -L/lib/arm-linux-gnueabihf -L/usr/lib/arm-linux-gnueabihf -lgfortran -lm -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' Making all in scripts @@ -3612,12 +3649,12 @@ Making all in doc gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/doc' /bin/mkdir -p man -/bin/mkdir -p man -gmake makedox -SOURCE_DATE_EPOCH=1704114061 \ +SOURCE_DATE_EPOCH=1704020461 \ help2man --name="benchmark and test for librsb" --no-info ../rsbench | /bin/sed 's/January //g' > man/rsbench.1 -SOURCE_DATE_EPOCH=1704114061 \ +/bin/mkdir -p man +SOURCE_DATE_EPOCH=1704020461 \ help2man --name="provide configuration information for librsb" --no-info /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb-config | /bin/sed 's/January //g' > man/librsb-config.1 +gmake makedox gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/doc' DOXYGEN_PROJECT_NUMBER=1.3.0.2 doxygen Doxyfile || echo "are you sure you have doxygen installed ?" warning: Tag 'LATEX_SOURCE_CODE' at line 2082 of file 'Doxyfile' has become obsolete. @@ -4259,13 +4296,13 @@ g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o rgt-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o rgt_ne-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o rgt_rv-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -libtool: link: g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' Making all in examples @@ -4275,8 +4312,6 @@ g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o bench.o bench.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o build.o build.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o misc.o misc.cpp -g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o twonnz.o twonnz.cpp -g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o example.o example.cpp In file included from /usr/include/c++/12/vector:64, from ../rsb.hpp:57, from misc.cpp:31: @@ -4291,55 +4326,57 @@ misc.cpp:70:48: note: parameter passing for argument of type 'std::initializer_list' changed in GCC 7.1 70 | const std::vector VA {1,1,1,1,1,1,2}, X(ncA,1); | ^ +g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o twonnz.o twonnz.cpp +g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o example.o example.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o mtx2bin.o mtx2bin.cpp +g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o render.o render.cpp +g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o span.o span.cpp In file included from /usr/include/c++/12/vector:70, from twonnz.cpp:33: /usr/include/c++/12/bits/vector.tcc: In member function 'void std::vector<_Tp, _Alloc>::_M_realloc_insert(iterator, _Args&& ...) [with _Args = {const double&}; _Tp = double; _Alloc = std::allocator]': /usr/include/c++/12/bits/vector.tcc:439:7: note: parameter passing for argument of type 'std::vector::iterator' changed in GCC 7.1 439 | vector<_Tp, _Alloc>:: | ^~~~~~~~~~~~~~~~~~~ +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la In file included from /usr/include/c++/12/vector:64: In member function 'void std::vector<_Tp, _Alloc>::push_back(const value_type&) [with _Tp = double; _Alloc = std::allocator]', inlined from 'void bench(rsb_coo_idx_t, rsb_coo_idx_t, nt_t, nt_t) [with nt_t = std::complex]' at twonnz.cpp:87:17: /usr/include/c++/12/bits/stl_vector.h:1287:28: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator >' changed in GCC 7.1 1287 | _M_realloc_insert(end(), __x); | ~~~~~~~~~~~~~~~~~^~~~~~~~~~~~ -g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o render.o render.cpp +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp In member function 'void std::vector<_Tp, _Alloc>::push_back(const value_type&) [with _Tp = double; _Alloc = std::allocator]', inlined from 'void bench(rsb_coo_idx_t, rsb_coo_idx_t, nt_t, nt_t) [with nt_t = double]' at twonnz.cpp:87:17: /usr/include/c++/12/bits/stl_vector.h:1287:28: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator >' changed in GCC 7.1 1287 | _M_realloc_insert(end(), __x); | ~~~~~~~~~~~~~~~~~^~~~~~~~~~~~ +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp In member function 'void std::vector<_Tp, _Alloc>::push_back(const value_type&) [with _Tp = double; _Alloc = std::allocator]', inlined from 'void bench(rsb_coo_idx_t, rsb_coo_idx_t, nt_t, nt_t) [with nt_t = std::complex]' at twonnz.cpp:87:17: /usr/include/c++/12/bits/stl_vector.h:1287:28: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator >' changed in GCC 7.1 1287 | _M_realloc_insert(end(), __x); | ~~~~~~~~~~~~~~~~~^~~~~~~~~~~~ +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp In member function 'void std::vector<_Tp, _Alloc>::push_back(const value_type&) [with _Tp = double; _Alloc = std::allocator]', inlined from 'void bench(rsb_coo_idx_t, rsb_coo_idx_t, nt_t, nt_t) [with nt_t = float]' at twonnz.cpp:87:17: /usr/include/c++/12/bits/stl_vector.h:1287:28: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator >' changed in GCC 7.1 1287 | _M_realloc_insert(end(), __x); | ~~~~~~~~~~~~~~~~~^~~~~~~~~~~~ -g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o span.o span.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib/examples' gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' @@ -4390,7 +4427,7 @@ /usr/include/c++/12/bits/vector.tcc:123:28: note: parameter passing for argument of type '__gnu_cxx::__normal_iterator*, std::vector, std::allocator > > >' changed in GCC 7.1 123 | _M_realloc_insert(end(), std::forward<_Args>(__args)...); | ~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lstdc++fs -fopenmp gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' @@ -4466,7 +4503,7 @@ gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake mtests -C . gmake[3]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash -ex ./scripts/readme-tests.sh +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh -ex ./scripts/readme-tests.sh + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x + ./rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # --bench option implies -qH -R --write-performance-record --want-mkl-autotune --mkl-benchmark --types : --split-experimental 6 --merge-experimental 6 --also-transpose --sort-filenames-list --want-memory-benchmark @@ -4476,15 +4513,15 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1710619212 +# beginning run at 1710622465 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -# average timer granularity: 1.12e-07 s -# Will write a final performance record to file rsbench_pr__1710619212_gcc-12.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1710619212_gcc-12.2-1,4th.rpr.tmp +# average timer granularity: 9.73e-08 s +# Will write a final performance record to file rsbench_pr__1710622465_gcc-12.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1710622465_gcc-12.2-1,4th.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -4523,61 +4560,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: virt64c +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 6.183s +# Memory benchmark took 6.300s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 8 samples (2240 bytes). # Cache block size total 524288 bytes, per-thread 131072 bytes -# so far, program took 6.188s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 6.305s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type Z... -# file input of A.mtx took 0.00 s (6 nnz, 26687 nnz/s ) (0.82 MB/s ) -#pre-sorting (6 elements) took 0.00141001 s +# file input of A.mtx took 0.00 s (6 nnz, 25420 nnz/s ) (0.78 MB/s ) +#pre-sorting (6 elements) took 0.00383115 s #weeding duplicates (to 6 elements) took 3.09944e-06 s (and check, 1.90735e-06 s ) # multi-nrhs benchmarking (1,2) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.006s): (3 x 3)[0x21a46c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.017s): (3 x 3)[0x1af4710]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 0.003213s; avg 0.001071s ( +/- 49.40/ 50.42 %); best 0.0005419s; worst 0.001611s; std dev. 0.0004365 (taking best). -Reference operation time is 0.000541925 s (0.1771 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0005419 Mflops: 0.177) -Merge (3 -> 1 leaves) took w.c.t. of 3.791e-05s, ~1.311e-05s of computing time (of which 1.907e-06s sorting, 7.868e-06s analysis) -3 iterations (1 th.) took 7.296e-05s; avg 2.432e-05s ( +/- 96.08/187.25 %); best 9.537e-07s; worst 6.986e-05s; std dev. 3.22e-05 (taking best). +3 iterations (1 th.) took 0.009307s; avg 0.003102s ( +/- 19.45/ 16.75 %); best 0.002499s; worst 0.003622s; std dev. 0.0004622 (taking best). +Reference operation time is 0.0024991 s (0.03841 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002499 Mflops: 0.038) +Merge (3 -> 1 leaves) took w.c.t. of 3.481e-05s, ~1.192e-05s of computing time (of which 2.146e-06s sorting, 7.868e-06s analysis) +3 iterations (1 th.) took 0.000212s; avg 7.065e-05s ( +/- 98.65/195.95 %); best 9.537e-07s; worst 0.0002091s; std dev. 9.789e-05 (taking best). Reference operation time is 9.53674e-07 s (100.7 Mflops) with 1 threads. After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 568.250x: 0.0005419s -> 9.537e-07s, so taking this instance. +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 2620.500x: 0.002499s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00318s (of which 4.697e-05s partitioning, 0s I/O); computing times: 1.311e-05s in par. loops, 1.907e-06s sorting, 7.868e-06s analyzing) -Total merge + benchmarking process took 0.00318s, equivalent to 3334.5/5.9 new/old ops (0.006108s for 2 clones -- as 6405.0/11.3 ops, or 3202.5/5.6 ops per clone), SPEEDUP of 568.250x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 568.250x (0.0005419s -> 9.537e-07s), will amortize in 5.9 ops by saving 0.000541s per op. -In 1 tuning rounds (tot. 0.0096s, 0.0061s for constructor, 2 clones) obtained a SPEEDUP of 56725.0% (568.2x) (from 0.1771 to 100.7 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01139s (of which 4.315e-05s partitioning, 0s I/O); computing times: 1.192e-05s in par. loops, 2.146e-06s sorting, 7.868e-06s analyzing) +Total merge + benchmarking process took 0.01139s, equivalent to 11946.5/4.6 new/old ops (0.02316s for 2 clones -- as 24284.2/9.3 ops, or 12142.1/4.6 ops per clone), SPEEDUP of 2620.500x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 2620.500x (0.002499s -> 9.537e-07s), will amortize in 4.6 ops by saving 0.002498s per op. +In 1 tuning rounds (tot. 0.033s, 0.023s for constructor, 2 clones) obtained a SPEEDUP of 261950.0% (2620x) (from 0.03841 to 100.7 Mflops). #pr: updating sample at index 1 (0^th of 8), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.00963593 s (5.419e-04 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0329351 s (2.499e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0529931 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.185767 s and estimated a speedup of 1.000000 x (8.900e-08 s -> 8.900e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.001137 0.002261 0.003398 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.003398 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.001137 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.002261 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.004883 0.006038 0.010921 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.010921 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.004883 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.006038 %:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.003398 +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.010921 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 @@ -4592,47 +4629,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.006s): (3 x 3)[0x21a8380]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.024s): (3 x 3)[0x1af83e0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.03257s; avg 0.01086s ( +/- 89.92/179.49 %); best 0.001094s; worst 0.03034s; std dev. 0.01378 (taking best). -Reference operation time is 0.0010941 s (0.08774 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001094 Mflops: 0.088) -Merge (3 -> 1 leaves) took w.c.t. of 2.789e-05s, ~8.106e-06s of computing time (of which 9.537e-07s sorting, 5.96e-06s analysis) -3 iterations (4 th.) took 6.914e-06s; avg 2.305e-06s ( +/- 58.62/117.24 %); best 9.537e-07s; worst 5.007e-06s; std dev. 1.911e-06 (taking best). -Reference operation time is 9.53674e-07 s (100.7 Mflops) with 4 threads. -After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1147.250x: 0.001094s -> 9.537e-07s, so taking this instance. +3 iterations (4 th.) took 0.01012s; avg 0.003373s ( +/- 29.56/ 43.12 %); best 0.002376s; worst 0.004828s; std dev. 0.001052 (taking best). +Reference operation time is 0.00237608 s (0.0404 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002376 Mflops: 0.040) +Merge (3 -> 1 leaves) took w.c.t. of 1.788e-05s, ~6.914e-06s of computing time (of which 1.907e-06s sorting, 3.815e-06s analysis) +3 iterations (4 th.) took 5.96e-06s; avg 1.987e-06s ( +/- 95.52/152.00 %); best 8.9e-08s; worst 5.007e-06s; std dev. 2.171e-06 (taking best). +Reference operation time is 8.90017e-08 s (1079 Mflops) with 4 threads. +After merge step 1: tpop: 8.9e-08 s ~Mflops: 1078.632 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 26697.027x: 0.002376s -> 8.9e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003124s (of which 3.481e-05s partitioning, 0s I/O); computing times: 8.106e-06s in par. loops, 9.537e-07s sorting, 5.96e-06s analyzing) -Total merge + benchmarking process took 0.003124s, equivalent to 3275.8/2.9 new/old ops (0.006122s for 2 clones -- as 6419.5/5.6 ops, or 3209.8/2.8 ops per clone), SPEEDUP of 1147.250x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 1147.250x (0.001094s -> 9.537e-07s), will amortize in 2.9 ops by saving 0.001093s per op. -In 1 tuning rounds (tot. 0.039s, 0.0061s for constructor, 2 clones) obtained a SPEEDUP of 114625.0% (1147x) (from 0.08774 to 100.7 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01161s (of which 2.408e-05s partitioning, 0s I/O); computing times: 6.914e-06s in par. loops, 1.907e-06s sorting, 3.815e-06s analyzing) +Total merge + benchmarking process took 0.01161s, equivalent to 130471.5/4.9 new/old ops (0.02288s for 2 clones -- as 257098.8/9.6 ops, or 128549.4/4.8 ops per clone), SPEEDUP of 26697.027x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 26697.027x (0.002376s -> 8.9e-08s), will amortize in 4.9 ops by saving 0.002376s per op. +In 1 tuning rounds (tot. 0.033s, 0.023s for constructor, 2 clones) obtained a SPEEDUP of 2669602.7% (2.67e+04x) (from 0.0404 to 1079 Mflops). #pr: updating sample at index 5 (1^th of 8), 0^th touch for (0,1,0,0,0,0,0). -First run of RSB Autotuner took 0.038852 s (1.094e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.033134 s (2.376e-03 s -> 8.900e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0961781 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.183674 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002133 0.002221 0.004354 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004354 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002133 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002221 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.009967 0.007155 0.017122 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.017122 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.009967 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.007155 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004354 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.017122 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.78 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.78 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.53 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 1.02 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.53 1.02 0.78 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.64 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.64 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.49 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.84 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.49 0.84 0.64 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -4641,50 +4678,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 0.00554204 1e+09 1e+09 +%operation:A.mtx 0.017231 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 0 0.00113702 0 0.00226092 +%constructor:A.mtx 0 0.00488305 0 0.00603795 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,2) -- now using nrhs 2. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.006s): (3 x 3)[0x21a8380]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.020s): (3 x 3)[0x1af83e0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 0.00375s; avg 0.00125s ( +/- 17.85/ 34.64 %); best 0.001027s; worst 0.001683s; std dev. 0.0003062 (taking best). -Reference operation time is 0.00102687 s (0.187 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001027 Mflops: 0.187) -Merge (3 -> 1 leaves) took w.c.t. of 2.408e-05s, ~7.153e-06s of computing time (of which 1.907e-06s sorting, 5.007e-06s analysis) -3 iterations (1 th.) took 4.387e-05s; avg 1.462e-05s ( +/- 93.48/180.43 %); best 9.537e-07s; worst 4.101e-05s; std dev. 1.866e-05 (taking best). -Reference operation time is 9.53674e-07 s (201.3 Mflops) with 1 threads. -After merge step 1: tpop: 9.537e-07 s ~Mflops: 201.327 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1076.750x: 0.001027s -> 9.537e-07s, so taking this instance. +3 iterations (1 th.) took 0.01214s; avg 0.004047s ( +/- 39.19/ 22.24 %); best 0.002461s; worst 0.004947s; std dev. 0.001125 (taking best). +Reference operation time is 0.00246096 s (0.07802 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002461 Mflops: 0.078) +Merge (3 -> 1 leaves) took w.c.t. of 1.907e-05s, ~6.914e-06s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) +3 iterations (1 th.) took 9.012e-05s; avg 3.004e-05s ( +/- 93.65/186.51 %); best 1.907e-06s; worst 8.607e-05s; std dev. 3.962e-05 (taking best). +Reference operation time is 1.90735e-06 s (100.7 Mflops) with 1 threads. +After merge step 1: tpop: 1.907e-06 s ~Mflops: 100.663 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1290.250x: 0.002461s -> 1.907e-06s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002763s (of which 3.099e-05s partitioning, 0s I/O); computing times: 7.153e-06s in par. loops, 1.907e-06s sorting, 5.007e-06s analyzing) -Total merge + benchmarking process took 0.002763s, equivalent to 2897.2/2.7 new/old ops (0.00537s for 2 clones -- as 5631.0/5.2 ops, or 2815.5/2.6 ops per clone), SPEEDUP of 1076.750x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 1076.750x (0.001027s -> 9.537e-07s), will amortize in 2.7 ops by saving 0.001026s per op. -In 1 tuning rounds (tot. 0.0093s, 0.0054s for constructor, 2 clones) obtained a SPEEDUP of 107575.0% (1077x) (from 0.187 to 201.3 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01109s (of which 2.408e-05s partitioning, 0s I/O); computing times: 6.914e-06s in par. loops, 1.907e-06s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.01109s, equivalent to 5815.9/4.5 new/old ops (0.02087s for 2 clones -- as 10941.9/8.5 ops, or 5470.9/4.2 ops per clone), SPEEDUP of 1290.250x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 1290.250x (0.002461s -> 1.907e-06s), will amortize in 4.5 ops by saving 0.002459s per op. +In 1 tuning rounds (tot. 0.033s, 0.021s for constructor, 2 clones) obtained a SPEEDUP of 128925.0% (1290x) (from 0.07802 to 100.7 Mflops). #pr: updating sample at index 3 (2^th of 8), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.00931907 s (1.027e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0332279 s (2.461e-03 s -> 1.907e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.054333 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.186733 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.001104 0.002127 0.003231 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.003231 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.001104 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.002127 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.005461 0.006833 0.012294 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.012294 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.005461 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.006833 %:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.003231 +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.012294 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 @@ -4699,47 +4736,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.007s): (3 x 3)[0x21a8380]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.022s): (3 x 3)[0x1af83e0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.02466s; avg 0.008222s ( +/- 82.68/162.09 %); best 0.001424s; worst 0.02155s; std dev. 0.009424 (taking best). -Reference operation time is 0.00142407 s (0.1348 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001424 Mflops: 0.135) -Merge (3 -> 1 leaves) took w.c.t. of 2.789e-05s, ~8.106e-06s of computing time (of which 2.146e-06s sorting, 5.96e-06s analysis) -3 iterations (4 th.) took 1.001e-05s; avg 3.338e-06s ( +/- 71.43/107.14 %); best 9.537e-07s; worst 6.914e-06s; std dev. 2.575e-06 (taking best). -Reference operation time is 9.53674e-07 s (201.3 Mflops) with 4 threads. -After merge step 1: tpop: 9.537e-07 s ~Mflops: 201.327 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1493.250x: 0.001424s -> 9.537e-07s, so taking this instance. +3 iterations (4 th.) took 0.01055s; avg 0.003515s ( +/- 35.05/ 37.41 %); best 0.002283s; worst 0.00483s; std dev. 0.001041 (taking best). +Reference operation time is 0.0022831 s (0.0841 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002283 Mflops: 0.084) +Merge (3 -> 1 leaves) took w.c.t. of 1.812e-05s, ~7.153e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) +3 iterations (4 th.) took 8.106e-06s; avg 2.702e-06s ( +/- 55.88/ 85.29 %); best 1.192e-06s; worst 5.007e-06s; std dev. 1.656e-06 (taking best). +Reference operation time is 1.19209e-06 s (161.1 Mflops) with 4 threads. +After merge step 1: tpop: 1.192e-06 s ~Mflops: 161.061 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1915.200x: 0.002283s -> 1.192e-06s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003184s (of which 3.386e-05s partitioning, 0s I/O); computing times: 8.106e-06s in par. loops, 2.146e-06s sorting, 5.96e-06s analyzing) -Total merge + benchmarking process took 0.003184s, equivalent to 3338.5/2.2 new/old ops (0.006293s for 2 clones -- as 6598.8/4.4 ops, or 3299.4/2.2 ops per clone), SPEEDUP of 1493.250x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 1493.250x (0.001424s -> 9.537e-07s), will amortize in 2.2 ops by saving 0.001423s per op. -In 1 tuning rounds (tot. 0.031s, 0.0063s for constructor, 2 clones) obtained a SPEEDUP of 149225.0% (1493x) (from 0.1348 to 201.3 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.008624s (of which 2.503e-05s partitioning, 0s I/O); computing times: 7.153e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.008624s, equivalent to 7234.4/3.8 new/old ops (0.02041s for 2 clones -- as 17121.4/8.9 ops, or 8560.7/4.5 ops per clone), SPEEDUP of 1915.200x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 1915.200x (0.002283s -> 1.192e-06s), will amortize in 3.8 ops by saving 0.002282s per op. +In 1 tuning rounds (tot. 0.031s, 0.02s for constructor, 2 clones) obtained a SPEEDUP of 191420.0% (1915x) (from 0.0841 to 161.1 Mflops). #pr: updating sample at index 7 (3^th of 8), 0^th touch for (0,1,0,0,1,0,0). -First run of RSB Autotuner took 0.0311232 s (1.424e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0310879 s (2.283e-03 s -> 1.192e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.115048 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.184593 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002334 0.002127 0.004461 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004461 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002334 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002127 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.006974 0.008067 0.015041 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.015041 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.006974 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.008067 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004461 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.015041 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.72 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.72 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.47 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.47 1.00 0.72 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.82 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.82 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.78 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.85 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.78 0.85 0.82 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -4748,185 +4785,185 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 0.00590086 1e+09 1e+09 +%operation:A.mtx 0.0203972 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 0 0.00110388 0 0.00212693 +%constructor:A.mtx 0 0.00546122 0 0.00683284 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 6.663s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.407s/0.000s . +# so far, program took 7.379s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.871s/0.000s . getrusage() stats: ru_maxrss: 5 (maximum resident set size -- MB) -ru_stime : 0.06033s (system CPU time used) -ru_utime : 7.522s (user CPU time used) +ru_stime : 0.09231s (system CPU time used) +ru_utime : 7.272s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 5.419e-04 0.000e+00 9.537e-07 0.000e+00 9.636e-03 2.81e-01 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 100.66 1.094e-03 0.000e+00 9.537e-07 0.000e+00 3.885e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 2.499e-03 0.000e+00 9.537e-07 0.000e+00 3.294e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1078.63 2.376e-03 0.000e+00 8.900e-08 0.000e+00 3.313e-02 3.01e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 85675.0 % faster, avg. sp. ratio 857.750x, max sp. ratio 1147.250x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 25421.6/10104.0/40739.2/50843.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 26.6/ 17.8/ 35.5/ 53.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 26.7, min. 17.8, max. 35.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1465776.3 % faster, avg. sp. ratio 14658.763x, max sp. ratio 26697.027x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 203410.0/34535.0/372285.0/406820.0 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.6/ 13.2/ 13.9/ 27.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.6, min. 13.2, max. 13.9 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.231/ 0.231/ 0.231,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.562/ 0.281/ 0.281,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.351/ 0.231/ 2.472,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.292/ 0.281/ 3.011,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.05 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.05 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.007e+02, min 1.007e+02, max 1.007e+02 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.324e-01, min 8.774e-02, max 1.771e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 1.907e-06s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.180e-04s, min 5.419e-04s, max 1.094e-03s, tot 1.636e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.548e+01 2.548e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.965e-01 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.07 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.07 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 5.896e+02, min 1.007e+02, max 1.079e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.941e-02, min 3.841e-02, max 4.040e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.213e-07s, min 8.900e-08s, max 9.537e-07s, tot 1.043e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.438e-03s, min 2.376e-03s, max 2.499e-03s, tot 4.875e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.382e+00 2.552e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.963e-01 #pr: ======== Limiting to nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 201.33 1.027e-03 0.000e+00 9.537e-07 0.000e+00 9.319e-03 4.32e-01 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 201.33 1.424e-03 0.000e+00 9.537e-07 0.000e+00 3.112e-02 4.32e-01 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 2.461e-03 0.000e+00 1.907e-06 0.000e+00 3.323e-02 2.16e-01 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 161.06 2.283e-03 0.000e+00 1.192e-06 0.000e+00 3.109e-02 3.46e-01 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 128400.0 % faster, avg. sp. ratio 1285.000x, max sp. ratio 1493.250x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21203.4/9771.8/32635.0/42406.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.5/ 9.1/ 21.9/ 30.9 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 15.5, min. 9.1, max. 21.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 160172.5 % faster, avg. sp. ratio 1602.725x, max sp. ratio 1915.200x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21749.7/17421.0/26078.4/43499.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.6/ 13.5/ 13.6/ 27.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.6, min. 13.5, max. 13.6 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.331/ 0.331/ 0.331,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.864/ 0.432/ 0.432,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.215/ 0.166/ 0.265,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.562/ 0.216/ 0.346,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.03 s, tot 0.04 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.03 s, tot 0.04 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.013e+02, min 2.013e+02, max 2.013e+02 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.609e-01, min 1.348e-01, max 1.870e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 1.907e-06s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.225e-03s, min 1.027e-03s, max 1.424e-03s, tot 2.451e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.774e+01 1.774e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.965e-01 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.309e+02, min 1.007e+02, max 1.611e+02 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.106e-02, min 7.802e-02, max 8.410e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 1.550e-06s, min 1.192e-06s, max 1.907e-06s, tot 3.099e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.372e-03s, min 2.283e-03s, max 2.461e-03s, tot 4.744e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.221e+01 3.554e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.963e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 5.747e-01 x, min 1.493e-01 x, max 1.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 5.419e-04 0.000e+00 9.537e-07 0.000e+00 9.636e-03 2.81e-01 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 201.33 1.027e-03 0.000e+00 9.537e-07 0.000e+00 9.319e-03 4.32e-01 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 100.66 1.094e-03 0.000e+00 9.537e-07 0.000e+00 3.885e-02 2.81e-01 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 201.33 1.424e-03 0.000e+00 9.537e-07 0.000e+00 3.112e-02 4.32e-01 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 2.499e-03 0.000e+00 9.537e-07 0.000e+00 3.294e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 2.461e-03 0.000e+00 1.907e-06 0.000e+00 3.323e-02 2.16e-01 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1078.63 2.376e-03 0.000e+00 8.900e-08 0.000e+00 3.313e-02 3.01e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 161.06 2.283e-03 0.000e+00 1.192e-06 0.000e+00 3.109e-02 3.46e-01 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 107037.5 % faster, avg. sp. ratio 1071.375x, max sp. ratio 1493.250x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 23312.5/9771.8/40739.2/93250.0 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21.1/ 9.1/ 35.5/ 84.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 21.1, min. 9.1, max. 35.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 812974.4 % faster, avg. sp. ratio 8130.744x, max sp. ratio 26697.027x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 112579.9/17421.0/372285.0/450319.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.6/ 13.2/ 13.9/ 54.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.6, min. 13.2, max. 13.9 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.281/ 0.231/ 0.331,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 1.426/ 0.281/ 0.432,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.783/ 0.166/ 2.472,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.854/ 0.216/ 3.011,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.09 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.09 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.510e+02, min 1.007e+02, max 2.013e+02 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.467e-01, min 8.774e-02, max 1.870e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 3.815e-06s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.022e-03s, min 5.419e-04s, max 1.424e-03s, tot 4.087e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.774e+01 2.548e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.965e-01 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.13 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.13 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.603e+02, min 1.007e+02, max 1.079e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 6.023e-02, min 3.841e-02, max 8.410e-02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 1.036e-06s, min 8.900e-08s, max 1.907e-06s, tot 4.142e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.405e-03s, min 2.283e-03s, max 2.499e-03s, tot 9.619e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.382e+00 3.554e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.963e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 5.747e-01 x, min 1.493e-01 x, max 1.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 5.419e-04 0.000e+00 9.537e-07 0.000e+00 9.636e-03 2.81e-01 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 100.66 1.094e-03 0.000e+00 9.537e-07 0.000e+00 3.885e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 2.499e-03 0.000e+00 9.537e-07 0.000e+00 3.294e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1078.63 2.376e-03 0.000e+00 8.900e-08 0.000e+00 3.313e-02 3.01e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 85675.0 % faster, avg. sp. ratio 857.750x, max sp. ratio 1147.250x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 25421.6/10104.0/40739.2/50843.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 26.6/ 17.8/ 35.5/ 53.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 26.7, min. 17.8, max. 35.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1465776.3 % faster, avg. sp. ratio 14658.763x, max sp. ratio 26697.027x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 203410.0/34535.0/372285.0/406820.0 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.6/ 13.2/ 13.9/ 27.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.6, min. 13.2, max. 13.9 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.231/ 0.231/ 0.231,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.562/ 0.281/ 0.281,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.351/ 0.231/ 2.472,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.292/ 0.281/ 3.011,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.05 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.05 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.007e+02, min 1.007e+02, max 1.007e+02 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.324e-01, min 8.774e-02, max 1.771e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 1.907e-06s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.180e-04s, min 5.419e-04s, max 1.094e-03s, tot 1.636e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.548e+01 2.548e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.965e-01 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.07 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.07 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 5.896e+02, min 1.007e+02, max 1.079e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.941e-02, min 3.841e-02, max 4.040e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.213e-07s, min 8.900e-08s, max 9.537e-07s, tot 1.043e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.438e-03s, min 2.376e-03s, max 2.499e-03s, tot 4.875e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.382e+00 2.552e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.963e-01 #pr: ======== Limiting to both transA=N and nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 201.33 1.027e-03 0.000e+00 9.537e-07 0.000e+00 9.319e-03 4.32e-01 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 201.33 1.424e-03 0.000e+00 9.537e-07 0.000e+00 3.112e-02 4.32e-01 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 2.461e-03 0.000e+00 1.907e-06 0.000e+00 3.323e-02 2.16e-01 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 161.06 2.283e-03 0.000e+00 1.192e-06 0.000e+00 3.109e-02 3.46e-01 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 128400.0 % faster, avg. sp. ratio 1285.000x, max sp. ratio 1493.250x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21203.4/9771.8/32635.0/42406.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.5/ 9.1/ 21.9/ 30.9 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 15.5, min. 9.1, max. 21.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 160172.5 % faster, avg. sp. ratio 1602.725x, max sp. ratio 1915.200x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21749.7/17421.0/26078.4/43499.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.6/ 13.5/ 13.6/ 27.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.6, min. 13.5, max. 13.6 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.331/ 0.331/ 0.331,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.864/ 0.432/ 0.432,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.215/ 0.166/ 0.265,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.562/ 0.216/ 0.346,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.03 s, tot 0.04 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.03 s, tot 0.04 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.013e+02, min 2.013e+02, max 2.013e+02 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.609e-01, min 1.348e-01, max 1.870e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 1.907e-06s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.225e-03s, min 1.027e-03s, max 1.424e-03s, tot 2.451e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.774e+01 1.774e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.965e-01 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.309e+02, min 1.007e+02, max 1.611e+02 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.106e-02, min 7.802e-02, max 8.410e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 1.550e-06s, min 1.192e-06s, max 1.907e-06s, tot 3.099e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.372e-03s, min 2.283e-03s, max 2.461e-03s, tot 4.744e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.221e+01 3.554e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.963e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 5.747e-01 x, min 1.493e-01 x, max 1.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 4) matched the dump criteria -- skipping dump round. #pr: ======== Limiting to both transA=T and nrhs=1: @@ -4936,44 +4973,44 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 5.419e-04 0.000e+00 9.537e-07 0.000e+00 9.636e-03 2.81e-01 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 201.33 1.027e-03 0.000e+00 9.537e-07 0.000e+00 9.319e-03 4.32e-01 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 100.66 1.094e-03 0.000e+00 9.537e-07 0.000e+00 3.885e-02 2.81e-01 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 201.33 1.424e-03 0.000e+00 9.537e-07 0.000e+00 3.112e-02 4.32e-01 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 2.499e-03 0.000e+00 9.537e-07 0.000e+00 3.294e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 2.461e-03 0.000e+00 1.907e-06 0.000e+00 3.323e-02 2.16e-01 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1078.63 2.376e-03 0.000e+00 8.900e-08 0.000e+00 3.313e-02 3.01e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 161.06 2.283e-03 0.000e+00 1.192e-06 0.000e+00 3.109e-02 3.46e-01 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 107037.5 % faster, avg. sp. ratio 1071.375x, max sp. ratio 1493.250x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 23312.5/9771.8/40739.2/93250.0 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21.1/ 9.1/ 35.5/ 84.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 21.1, min. 9.1, max. 35.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 812974.4 % faster, avg. sp. ratio 8130.744x, max sp. ratio 26697.027x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 112579.9/17421.0/372285.0/450319.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.6/ 13.2/ 13.9/ 54.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.6, min. 13.2, max. 13.9 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.281/ 0.231/ 0.331,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 1.426/ 0.281/ 0.432,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.783/ 0.166/ 2.472,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.854/ 0.216/ 3.011,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.09 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.09 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.510e+02, min 1.007e+02, max 2.013e+02 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.467e-01, min 8.774e-02, max 1.870e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 3.815e-06s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.022e-03s, min 5.419e-04s, max 1.424e-03s, tot 4.087e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.774e+01 2.548e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.965e-01 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) -#pr: Record collection took 0.35 s. +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.13 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.13 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.603e+02, min 1.007e+02, max 1.079e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 6.023e-02, min 3.841e-02, max 8.410e-02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 1.036e-06s, min 8.900e-08s, max 1.907e-06s, tot 4.142e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.405e-03s, min 2.283e-03s, max 2.499e-03s, tot 9.619e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.382e+00 3.554e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.963e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 5.747e-01 x, min 1.493e-01 x, max 1.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: Record collection took 0.86 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 90 environment variables in 3809 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 90 environment variables in 3863 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1710619212_gcc-12.2-1,4th.rpr -# Removing the temporary record file rsbench_pr__1710619212_gcc-12.2-1,4th.rpr.tmp. -# terminating run at 1710619218 (after 6.7s of w.c.t.) +#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1710622465_gcc-12.2-1,4th.rpr +# Removing the temporary record file rsbench_pr__1710622465_gcc-12.2-1,4th.rpr.tmp. +# terminating run at 1710622473 (after 7.4s of w.c.t.) + ./rsbench -oa -Ob --help /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench is a swiss army knife for testing the library functionality and performance. You can use it to perform sparse matrix - unitary vector multiplication, specifying the blocking parameters, the times to perform multiplication. @@ -5237,10 +5274,10 @@ L1 size: 24576 L2 size: 524288 sysconf() : 4096 bytes per pagesize -sysconf() : 1732235 physical pages -sysconf() : 2800267264 bytes (2670 MB) of physical memory -sysconf() : 574390 available (free) physical pages -sysconf() : 2352701440 available (free) physical memory +sysconf() : 1749468 physical pages +sysconf() : 2870853632 bytes (2737 MB) of physical memory +sysconf() : 215940 available (free) physical pages +sysconf() : 884490240 available (free) physical memory sysconf() , processors : 4 sysconf() , processors online : 4 sysconf() : no level 1 cache @@ -5270,25 +5307,25 @@ CXXFLAGS : -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp CC : gcc memhinfo : L2:4/64/512K,L1:8/64/24K -detected free memory : -1942265856 -detected total memory : -1494700032 -for array sized 524288 elems, took 0.000674963 s for linear search and 0 s for binary search for element 524287, in 145 tries, for a total of 0.100346 s (ignore this:152043230) -for array sized 524288 elems, took 0.000336885 s for linear search and 0 s for binary search for element 262143, in 293 tries, for a total of 0.100298 s (ignore this:305659028) -for array sized 524288 elems, took 0.0001688 s for linear search and 0 s for binary search for element 131071, in 584 tries, for a total of 0.100075 s (ignore this:458749956) -for array sized 524288 elems, took 8.39233e-05 s for linear search and 0 s for binary search for element 65535, in 1150 tries, for a total of 0.100027 s (ignore this:609480456) -for array sized 524288 elems, took 4.07696e-05 s for linear search and 0 s for binary search for element 32767, in 2296 tries, for a total of 0.100016 s (ignore this:759946520) -for array sized 524288 elems, took 1.97887e-05 s for linear search and 0 s for binary search for element 16383, in 4642 tries, for a total of 0.100000 s (ignore this:912046292) -for array sized 524288 elems, took 9.77516e-06 s for linear search and 0 s for binary search for element 8191, in 8904 tries, for a total of 0.100004 s (ignore this:1057911620) -for array sized 524288 elems, took 4.76837e-06 s for linear search and 0 s for binary search for element 4095, in 17779 tries, for a total of 0.100003 s (ignore this:1203521630) -for array sized 524288 elems, took 1.90735e-06 s for linear search and 0 s for binary search for element 2047, in 33996 tries, for a total of 0.100001 s (ignore this:1342701254) -for array sized 524288 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 1023, in 61663 tries, for a total of 0.100001 s (ignore this:1468863752) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 511, in 102973 tries, for a total of 0.100000 s (ignore this:1574102158) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 255, in 154620 tries, for a total of 0.100000 s (ignore this:1652958358) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 127, in 205641 tries, for a total of 0.100001 s (ignore this:1705191172) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 63, in 256521 tries, for a total of 0.100001 s (ignore this:1737512818) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 31, in 286431 tries, for a total of 0.100001 s (ignore this:1755271540) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 15, in 299848 tries, for a total of 0.100001 s (ignore this:1764266980) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 7, in 314703 tries, for a total of 0.100000 s (ignore this:1768672822) +detected free memory : 884490240 +detected total memory : -1424113664 +for array sized 524288 elems, took 0.000674009 s for linear search and 0 s for binary search for element 524287, in 145 tries, for a total of 0.100570 s (ignore this:152043230) +for array sized 524288 elems, took 0.00033617 s for linear search and 0 s for binary search for element 262143, in 293 tries, for a total of 0.100179 s (ignore this:305659028) +for array sized 524288 elems, took 0.000167847 s for linear search and 0 s for binary search for element 131071, in 585 tries, for a total of 0.100104 s (ignore this:459012098) +for array sized 524288 elems, took 8.29697e-05 s for linear search and 0 s for binary search for element 65535, in 1169 tries, for a total of 0.100022 s (ignore this:612232928) +for array sized 524288 elems, took 4.07696e-05 s for linear search and 0 s for binary search for element 32767, in 2401 tries, for a total of 0.100027 s (ignore this:769580062) +for array sized 524288 elems, took 1.97887e-05 s for linear search and 0 s for binary search for element 16383, in 4767 tries, for a total of 0.100002 s (ignore this:925775584) +for array sized 524288 elems, took 9.77516e-06 s for linear search and 0 s for binary search for element 8191, in 9404 tries, for a total of 0.100006 s (ignore this:1079831912) +for array sized 524288 elems, took 4.76837e-06 s for linear search and 0 s for binary search for element 4095, in 18303 tries, for a total of 0.100005 s (ignore this:1229733482) +for array sized 524288 elems, took 1.90735e-06 s for linear search and 0 s for binary search for element 2047, in 34905 tries, for a total of 0.100002 s (ignore this:1372634552) +for array sized 524288 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 1023, in 63357 tries, for a total of 0.100001 s (ignore this:1502262974) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 511, in 107140 tries, for a total of 0.100001 s (ignore this:1611760054) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 255, in 162851 tries, for a total of 0.100001 s (ignore this:1694814064) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 127, in 221030 tries, for a total of 0.100001 s (ignore this:1750955684) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 63, in 277350 tries, for a total of 0.100000 s (ignore this:1785901784) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 31, in 311378 tries, for a total of 0.100000 s (ignore this:1805207220) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 15, in 327706 tries, for a total of 0.100000 s (ignore this:1815038400) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 7, in 340986 tries, for a total of 0.100001 s (ignore this:1819812204) + ./rsbench -C /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench version: 1.3.0 format switches:br @@ -5335,17 +5372,17 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1710619221 +# beginning run at 1710622475 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx --verbose --nrhs 1,4 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 # User did not specify threads; assuming 1. Environment provides max 4 threads; this build supports max 128. # User did not specify threads; assuming 1. Environment provides max 4 threads; this build supports max 128. -# average timer granularity: 9.79e-08 s -# Will write a final performance record to file rsbench_pr__1710619221_gcc-12.2.rpr and periodic checkpoints to rsbench_pr__1710619221_gcc-12.2.rpr.tmp +# average timer granularity: 1.01e-07 s +# Will write a final performance record to file rsbench_pr__1710622475_gcc-12.2.rpr and periodic checkpoints to rsbench_pr__1710622475_gcc-12.2.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -5384,61 +5421,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: virt64c +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 6.149s +# Memory benchmark took 6.299s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 16 samples (4480 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 524288 bytes, per-thread 131072 bytes -# so far, program took 6.153s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 6.303s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type D... -# file input of A.mtx took 0.00 s (6 nnz, 24082 nnz/s ) (0.74 MB/s ) -#pre-sorting (6 elements) took 0.00164604 s -#weeding duplicates (to 6 elements) took 4.05312e-06 s (and check, 3.09944e-06 s ) +# file input of A.mtx took 0.00 s (6 nnz, 30803 nnz/s ) (0.94 MB/s ) +#pre-sorting (6 elements) took 0.00451303 s +#weeding duplicates (to 6 elements) took 3.09944e-06 s (and check, 1.90735e-06 s ) # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 4 threads -# Constructed matrix (took 0.007s): (3 x 3)[0x19cbf50]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.021s): (3 x 3)[0x19d0fa0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.003354s; avg 0.001118s ( +/- 4.56/ 3.22 %); best 0.001067s; worst 0.001154s; std dev. 3.708e-05 (taking best). -Reference operation time is 0.00106692 s (0.02249 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001067 Mflops: 0.022) -Merge (3 -> 1 leaves) took w.c.t. of 3.314e-05s, ~1.216e-05s of computing time (of which 1.907e-06s sorting, 7.153e-06s analysis) -3 iterations (4 th.) took 5.198e-05s; avg 1.733e-05s ( +/- 94.50/188.99 %); best 9.537e-07s; worst 5.007e-05s; std dev. 2.315e-05 (taking best). +3 iterations (4 th.) took 0.01097s; avg 0.003657s ( +/- 37.09/ 28.43 %); best 0.002301s; worst 0.004697s; std dev. 0.001003 (taking best). +Reference operation time is 0.00230098 s (0.01043 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002301 Mflops: 0.010) +Merge (3 -> 1 leaves) took w.c.t. of 3.314e-05s, ~1.216e-05s of computing time (of which 1.907e-06s sorting, 5.96e-06s analysis) +3 iterations (4 th.) took 0.000108s; avg 3.6e-05s ( +/- 97.35/192.05 %); best 9.537e-07s; worst 0.0001051s; std dev. 4.889e-05 (taking best). Reference operation time is 9.53674e-07 s (25.17 Mflops) with 4 threads. After merge step 1: tpop: 9.537e-07 s ~Mflops: 25.166 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 1118.750x: 0.001067s -> 9.537e-07s, so taking this instance. +Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 2412.750x: 0.002301s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003318s (of which 4.005e-05s partitioning, 0s I/O); computing times: 1.216e-05s in par. loops, 1.907e-06s sorting, 7.153e-06s analyzing) -Total merge + benchmarking process took 0.003318s, equivalent to 3479.0/3.1 new/old ops (0.006534s for 2 clones -- as 6851.5/6.1 ops, or 3425.8/3.1 ops per clone), SPEEDUP of 1118.750x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1118.750x (0.001067s -> 9.537e-07s), will amortize in 3.1 ops by saving 0.001066s per op. -In 1 tuning rounds (tot. 0.01s, 0.0065s for constructor, 2 clones) obtained a SPEEDUP of 111775.0% (1119x) (from 0.02249 to 25.17 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01064s (of which 3.91e-05s partitioning, 0s I/O); computing times: 1.216e-05s in par. loops, 1.907e-06s sorting, 5.96e-06s analyzing) +Total merge + benchmarking process took 0.01064s, equivalent to 11152.8/4.6 new/old ops (0.02025s for 2 clones -- as 21230.5/8.8 ops, or 10615.2/4.4 ops per clone), SPEEDUP of 2412.750x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2412.750x (0.002301s -> 9.537e-07s), will amortize in 4.6 ops by saving 0.0023s per op. +In 1 tuning rounds (tot. 0.031s, 0.02s for constructor, 2 clones) obtained a SPEEDUP of 241175.0% (2413x) (from 0.01043 to 25.17 Mflops). #pr: updating sample at index 1 (0^th of 16), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.0101309 s (1.067e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.031518 s (2.301e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.084084 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.178941 s and estimated a speedup of 1.000000 x (9.010e-08 s -> 9.010e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002170 0.002237 0.004407 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004407 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002170 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002237 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.007072 0.006880 0.013952 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.013952 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.007072 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.006880 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004407 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.013952 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 @@ -5453,50 +5490,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[4] SPMV[4] SPMV[4] -%operation:A.mtx 0.00650001 1e+09 1e+09 +%operation:A.mtx 0.0213909 1e+09 1e+09 %constructor:matrix SORT[4] SCAN[4] SHUFFLE[4] INSERT[4] -%constructor:A.mtx 0 0.00217009 0 0.00223708 +%constructor:A.mtx 0 0.00707197 0 0.00688004 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 4 threads -# Constructed matrix (took 0.006s): (3 x 3)[0x19ce3e0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.023s): (3 x 3)[0x19d37f0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.003265s; avg 0.001088s ( +/- 5.93/ 6.32 %); best 0.001024s; worst 0.001157s; std dev. 5.449e-05 (taking best). -Reference operation time is 0.00102377 s (0.09377 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001024 Mflops: 0.094) -Merge (3 -> 1 leaves) took w.c.t. of 2.313e-05s, ~7.868e-06s of computing time (of which 1.907e-06s sorting, 5.007e-06s analysis) -3 iterations (4 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 90.77/170.00 %); best 9.537e-07s; worst 2.789e-05s; std dev. 1.243e-05 (taking best). -Reference operation time is 9.53674e-07 s (100.7 Mflops) with 4 threads. -After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 1073.500x: 0.001024s -> 9.537e-07s, so taking this instance. +3 iterations (4 th.) took 0.009285s; avg 0.003095s ( +/- 29.63/ 36.48 %); best 0.002178s; worst 0.004224s; std dev. 0.0008487 (taking best). +Reference operation time is 0.00217795 s (0.04408 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002178 Mflops: 0.044) +Merge (3 -> 1 leaves) took w.c.t. of 2.193e-05s, ~8.106e-06s of computing time (of which 2.146e-06s sorting, 5.007e-06s analysis) +3 iterations (4 th.) took 3.719e-05s; avg 1.24e-05s ( +/- 90.38/175.00 %); best 1.192e-06s; worst 3.409e-05s; std dev. 1.534e-05 (taking best). +Reference operation time is 1.19209e-06 s (80.53 Mflops) with 4 threads. +After merge step 1: tpop: 1.192e-06 s ~Mflops: 80.531 nsubm:1 otn:4 +Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 1827.000x: 0.002178s -> 1.192e-06s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003124s (of which 2.909e-05s partitioning, 0s I/O); computing times: 7.868e-06s in par. loops, 1.907e-06s sorting, 5.007e-06s analyzing) -Total merge + benchmarking process took 0.003124s, equivalent to 3275.8/3.1 new/old ops (0.006096s for 2 clones -- as 6392.2/6.0 ops, or 3196.1/3.0 ops per clone), SPEEDUP of 1073.500x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1073.500x (0.001024s -> 9.537e-07s), will amortize in 3.1 ops by saving 0.001023s per op. -In 1 tuning rounds (tot. 0.0095s, 0.0061s for constructor, 2 clones) obtained a SPEEDUP of 107250.0% (1074x) (from 0.09377 to 100.7 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01038s (of which 2.789e-05s partitioning, 0s I/O); computing times: 8.106e-06s in par. loops, 2.146e-06s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.01038s, equivalent to 8706.6/4.8 new/old ops (0.02558s for 2 clones -- as 21458.8/11.7 ops, or 10729.4/5.9 ops per clone), SPEEDUP of 1827.000x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1827.000x (0.002178s -> 1.192e-06s), will amortize in 4.8 ops by saving 0.002177s per op. +In 1 tuning rounds (tot. 0.035s, 0.026s for constructor, 2 clones) obtained a SPEEDUP of 182600.0% (1827x) (from 0.04408 to 80.53 Mflops). #pr: updating sample at index 9 (1^th of 16), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.00953102 s (1.024e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0350449 s (2.178e-03 s -> 1.192e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0568531 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.179083 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002170 0.002070 0.004240 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004240 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002170 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002070 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.007071 0.010245 0.017316 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.017316 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.007071 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.010245 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004240 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.017316 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 @@ -5511,60 +5548,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[4] SPMV[4] SPMV[4] -%operation:A.mtx 0.006392 1e+09 1e+09 +%operation:A.mtx 0.0225339 1e+09 1e+09 %constructor:matrix SORT[4] SCAN[4] SHUFFLE[4] INSERT[4] -%constructor:A.mtx 0 0.00216985 0 0.00206995 +%constructor:A.mtx 0 0.00707102 0 0.0102448 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 6.348s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.161s/0.000s . +# so far, program took 6.833s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.425s/0.000s . getrusage() stats: -ru_maxrss: 7 (maximum resident set size -- MB) -ru_stime : 0.03201s (system CPU time used) -ru_utime : 6.692s (user CPU time used) +ru_maxrss: 5 (maximum resident set size -- MB) +ru_stime : 0.07626s (system CPU time used) +ru_utime : 6.755s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 524288 bytes, per-thread 131072 bytes -# so far, program took 6.348s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.161s/0.000s . +# so far, program took 6.833s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.425s/0.000s . # Reusing type converted (D->S) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 4 threads -# Constructed matrix (took 0.006s): (3 x 3)[0x19ce3e0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.026s): (3 x 3)[0x19d37f0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.01271s; avg 0.004235s ( +/- 87.11/150.04 %); best 0.000546s; worst 0.01059s; std dev. 0.004512 (taking best). -Reference operation time is 0.000545979 s (0.04396 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000546 Mflops: 0.044) -Merge (3 -> 1 leaves) took w.c.t. of 2.217e-05s, ~7.153e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) -3 iterations (4 th.) took 9.06e-06s; avg 3.02e-06s ( +/- 68.42/128.95 %); best 9.537e-07s; worst 6.914e-06s; std dev. 2.755e-06 (taking best). +3 iterations (4 th.) took 0.009238s; avg 0.003079s ( +/- 26.51/ 51.01 %); best 0.002263s; worst 0.00465s; std dev. 0.001111 (taking best). +Reference operation time is 0.00226307 s (0.01061 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002263 Mflops: 0.011) +Merge (3 -> 1 leaves) took w.c.t. of 3.004e-05s, ~1.812e-05s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (4 th.) took 6.914e-06s; avg 2.305e-06s ( +/- 58.62/117.24 %); best 9.537e-07s; worst 5.007e-06s; std dev. 1.911e-06 (taking best). Reference operation time is 9.53674e-07 s (25.17 Mflops) with 4 threads. After merge step 1: tpop: 9.537e-07 s ~Mflops: 25.166 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 572.500x: 0.000546s -> 9.537e-07s, so taking this instance. +Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 2373.000x: 0.002263s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00362s (of which 2.813e-05s partitioning, 0s I/O); computing times: 7.153e-06s in par. loops, 9.537e-07s sorting, 5.007e-06s analyzing) -Total merge + benchmarking process took 0.00362s, equivalent to 3796.0/6.6 new/old ops (0.006697s for 2 clones -- as 7022.0/12.3 ops, or 3511.0/6.1 ops per clone), SPEEDUP of 572.500x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 572.500x (0.000546s -> 9.537e-07s), will amortize in 6.6 ops by saving 0.000545s per op. -In 1 tuning rounds (tot. 0.02s, 0.0067s for constructor, 2 clones) obtained a SPEEDUP of 57150.0% (572.5x) (from 0.04396 to 25.17 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.0106s (of which 3.695e-05s partitioning, 0s I/O); computing times: 1.812e-05s in par. loops, 1.907e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.0106s, equivalent to 11118.0/4.7 new/old ops (0.02079s for 2 clones -- as 21797.8/9.2 ops, or 10898.9/4.6 ops per clone), SPEEDUP of 2373.000x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2373.000x (0.002263s -> 9.537e-07s), will amortize in 4.7 ops by saving 0.002262s per op. +In 1 tuning rounds (tot. 0.031s, 0.021s for constructor, 2 clones) obtained a SPEEDUP of 237200.0% (2373x) (from 0.01061 to 25.17 Mflops). #pr: updating sample at index 3 (2^th of 16), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.0197251 s (5.460e-04 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0305221 s (2.263e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.067729 s and estimated a speedup of 9.527212 x (9.537e-07 s -> 1.001e-07 s per op) in new matrix (1 -> 1 lsubm) -RSB Autotuner suggested a new matrix: freeing the old one. +Second run of RSB Autotuner took 0.156955 s and estimated a speedup of 1.000000 x (9.010e-08 s -> 9.010e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002133 0.002141 0.004274 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004274 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002133 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002141 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.006863 0.010136 0.016999 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.016999 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.006863 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.010136 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004274 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.016999 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 @@ -5579,50 +5615,51 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[4] SPMV[4] SPMV[4] -%operation:A.mtx 0.00638199 1e+09 1e+09 +%operation:A.mtx 0.0257308 1e+09 1e+09 %constructor:matrix SORT[4] SCAN[4] SHUFFLE[4] INSERT[4] -%constructor:A.mtx 0 0.00213313 0 0.002141 +%constructor:A.mtx 0 0.00686288 0 0.0101361 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 4 threads -# Constructed matrix (took 0.007s): (3 x 3)[0x19ce3e0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.025s): (3 x 3)[0x19d37f0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.007905s; avg 0.002635s ( +/- 60.80/121.03 %); best 0.001033s; worst 0.005824s; std dev. 0.002255 (taking best). -Reference operation time is 0.00103283 s (0.09295 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001033 Mflops: 0.093) -Merge (3 -> 1 leaves) took w.c.t. of 2.098e-05s, ~6.914e-06s of computing time (of which 9.537e-07s sorting, 3.815e-06s analysis) -3 iterations (4 th.) took 9.06e-06s; avg 3.02e-06s ( +/- 68.42/128.95 %); best 9.537e-07s; worst 6.914e-06s; std dev. 2.755e-06 (taking best). +3 iterations (4 th.) took 0.01144s; avg 0.003812s ( +/- 37.98/ 28.20 %); best 0.002364s; worst 0.004887s; std dev. 0.001063 (taking best). +Reference operation time is 0.00236416 s (0.04061 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002364 Mflops: 0.041) +Merge (3 -> 1 leaves) took w.c.t. of 1.788e-05s, ~5.96e-06s of computing time (of which 1.907e-06s sorting, 3.815e-06s analysis) +3 iterations (4 th.) took 8.106e-06s; avg 2.702e-06s ( +/- 64.71/120.59 %); best 9.537e-07s; worst 5.96e-06s; std dev. 2.306e-06 (taking best). Reference operation time is 9.53674e-07 s (100.7 Mflops) with 4 threads. After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 1083.000x: 0.001033s -> 9.537e-07s, so taking this instance. +Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 2479.000x: 0.002364s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003113s (of which 2.813e-05s partitioning, 0s I/O); computing times: 6.914e-06s in par. loops, 9.537e-07s sorting, 3.815e-06s analyzing) -Total merge + benchmarking process took 0.003113s, equivalent to 3264.2/3.0 new/old ops (0.006237s for 2 clones -- as 6539.8/6.0 ops, or 3269.9/3.0 ops per clone), SPEEDUP of 1083.000x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1083.000x (0.001033s -> 9.537e-07s), will amortize in 3.0 ops by saving 0.001032s per op. -In 1 tuning rounds (tot. 0.015s, 0.0062s for constructor, 2 clones) obtained a SPEEDUP of 108200.0% (1083x) (from 0.09295 to 100.7 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.009356s (of which 2.408e-05s partitioning, 0s I/O); computing times: 5.96e-06s in par. loops, 1.907e-06s sorting, 3.815e-06s analyzing) +Total merge + benchmarking process took 0.009356s, equivalent to 9810.5/4.0 new/old ops (0.02031s for 2 clones -- as 21301.8/8.6 ops, or 10650.9/4.3 ops per clone), SPEEDUP of 2479.000x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2479.000x (0.002364s -> 9.537e-07s), will amortize in 4.0 ops by saving 0.002363s per op. +In 1 tuning rounds (tot. 0.033s, 0.02s for constructor, 2 clones) obtained a SPEEDUP of 247800.0% (2479x) (from 0.04061 to 100.7 Mflops). #pr: updating sample at index 11 (3^th of 16), 0^th touch for (0,0,0,0,1,1,0). -First run of RSB Autotuner took 0.014801 s (1.033e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0329158 s (2.364e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.055743 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.156562 s and estimated a speedup of 10.584811 x (9.537e-07 s -> 9.010e-08 s per op) in new matrix (1 -> 1 lsubm) +RSB Autotuner suggested a new matrix: freeing the old one. #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002312 0.002662 0.004974 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004974 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002312 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002662 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.012041 0.007074 0.019115 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.019115 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.012041 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.007074 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004974 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.019115 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 @@ -5637,59 +5674,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[4] SPMV[4] SPMV[4] -%operation:A.mtx 0.00654602 1e+09 1e+09 +%operation:A.mtx 0.0248251 1e+09 1e+09 %constructor:matrix SORT[4] SCAN[4] SHUFFLE[4] INSERT[4] -%constructor:A.mtx 0 0.00231218 0 0.00266194 +%constructor:A.mtx 0 0.0120411 0 0.00707412 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 6.536s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.319s/0.000s . +# so far, program took 7.316s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.802s/0.000s . getrusage() stats: -ru_maxrss: 7 (maximum resident set size -- MB) -ru_stime : 0.0519s (system CPU time used) -ru_utime : 7.219s (user CPU time used) +ru_maxrss: 5 (maximum resident set size -- MB) +ru_stime : 0.09636s (system CPU time used) +ru_utime : 7.207s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was S). # Cache block size total 524288 bytes, per-thread 131072 bytes -# so far, program took 6.536s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.319s/0.000s . +# so far, program took 7.316s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.802s/0.000s . # Reusing type converted (S->C) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 4 threads -# Constructed matrix (took 0.006s): (3 x 3)[0x19ce8a0]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.025s): (3 x 3)[0x19d4ff0]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.01547s; avg 0.005158s ( +/- 78.67/156.49 %); best 0.0011s; worst 0.01323s; std dev. 0.005707 (taking best). -Reference operation time is 0.00110006 s (0.08727 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0011 Mflops: 0.087) -Merge (3 -> 1 leaves) took w.c.t. of 3.099e-05s, ~9.06e-06s of computing time (of which 9.537e-07s sorting, 7.153e-06s analysis) -3 iterations (4 th.) took 4.387e-05s; avg 1.462e-05s ( +/- 93.48/180.43 %); best 9.537e-07s; worst 4.101e-05s; std dev. 1.866e-05 (taking best). +3 iterations (4 th.) took 0.009296s; avg 0.003099s ( +/- 26.65/ 52.94 %); best 0.002273s; worst 0.004739s; std dev. 0.00116 (taking best). +Reference operation time is 0.00227284 s (0.04224 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002273 Mflops: 0.042) +Merge (3 -> 1 leaves) took w.c.t. of 1.979e-05s, ~8.106e-06s of computing time (of which 9.537e-07s sorting, 3.815e-06s analysis) +3 iterations (4 th.) took 7.796e-05s; avg 2.599e-05s ( +/- 96.33/188.07 %); best 9.537e-07s; worst 7.486e-05s; std dev. 3.456e-05 (taking best). Reference operation time is 9.53674e-07 s (100.7 Mflops) with 4 threads. After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 1153.500x: 0.0011s -> 9.537e-07s, so taking this instance. +Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 2383.250x: 0.002273s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003758s (of which 3.695e-05s partitioning, 0s I/O); computing times: 9.06e-06s in par. loops, 9.537e-07s sorting, 7.153e-06s analyzing) -Total merge + benchmarking process took 0.003758s, equivalent to 3940.5/3.4 new/old ops (0.006396s for 2 clones -- as 6706.8/5.8 ops, or 3353.4/2.9 ops per clone), SPEEDUP of 1153.500x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1153.500x (0.0011s -> 9.537e-07s), will amortize in 3.4 ops by saving 0.001099s per op. -In 1 tuning rounds (tot. 0.022s, 0.0064s for constructor, 2 clones) obtained a SPEEDUP of 115250.0% (1154x) (from 0.08727 to 100.7 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01032s (of which 2.718e-05s partitioning, 0s I/O); computing times: 8.106e-06s in par. loops, 9.537e-07s sorting, 3.815e-06s analyzing) +Total merge + benchmarking process took 0.01032s, equivalent to 10818.2/4.5 new/old ops (0.022s for 2 clones -- as 23073.0/9.7 ops, or 11536.5/4.8 ops per clone), SPEEDUP of 2383.250x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2383.250x (0.002273s -> 9.537e-07s), will amortize in 4.5 ops by saving 0.002272s per op. +In 1 tuning rounds (tot. 0.031s, 0.022s for constructor, 2 clones) obtained a SPEEDUP of 238225.0% (2383x) (from 0.04224 to 100.7 Mflops). #pr: updating sample at index 5 (4^th of 16), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.0225821 s (1.100e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0324521 s (2.273e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0584369 s and estimated a speedup of 1.000000 x (1.001e-07 s -> 1.001e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.176269 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002214 0.002127 0.004341 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004341 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002214 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002127 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.012739 0.006287 0.019026 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.019026 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.012739 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.006287 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004341 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.019026 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 @@ -5704,50 +5741,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[4] SPMV[4] SPMV[4] -%operation:A.mtx 0.00646091 1e+09 1e+09 +%operation:A.mtx 0.0249979 1e+09 1e+09 %constructor:matrix SORT[4] SCAN[4] SHUFFLE[4] INSERT[4] -%constructor:A.mtx 0 0.00221395 0 0.00212693 +%constructor:A.mtx 0 0.0127389 0 0.0062871 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 4 threads -# Constructed matrix (took 0.007s): (3 x 3)[0x19ce8a0]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.022s): (3 x 3)[0x19d4ff0]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.002699s; avg 0.0008997s ( +/- 33.96/ 18.80 %); best 0.0005941s; worst 0.001069s; std dev. 0.0002165 (taking best). -Reference operation time is 0.000594139 s (0.6463 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0005941 Mflops: 0.646) -Merge (3 -> 1 leaves) took w.c.t. of 2.599e-05s, ~7.868e-06s of computing time (of which 1.907e-06s sorting, 5.96e-06s analysis) -3 iterations (4 th.) took 1.097e-05s; avg 3.656e-06s ( +/- 73.91/121.74 %); best 9.537e-07s; worst 8.106e-06s; std dev. 3.171e-06 (taking best). -Reference operation time is 9.53674e-07 s (402.7 Mflops) with 4 threads. -After merge step 1: tpop: 9.537e-07 s ~Mflops: 402.653 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 623.000x: 0.0005941s -> 9.537e-07s, so taking this instance. +3 iterations (4 th.) took 0.01147s; avg 0.003822s ( +/- 36.76/ 26.88 %); best 0.002417s; worst 0.00485s; std dev. 0.001028 (taking best). +Reference operation time is 0.00241709 s (0.1589 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002417 Mflops: 0.159) +Merge (3 -> 1 leaves) took w.c.t. of 2.003e-05s, ~7.153e-06s of computing time (of which 2.146e-06s sorting, 4.053e-06s analysis) +3 iterations (4 th.) took 1.001e-05s; avg 3.338e-06s ( +/- 64.29/107.14 %); best 1.192e-06s; worst 6.914e-06s; std dev. 2.546e-06 (taking best). +Reference operation time is 1.19209e-06 s (322.1 Mflops) with 4 threads. +After merge step 1: tpop: 1.192e-06 s ~Mflops: 322.123 nsubm:1 otn:4 +Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 2027.600x: 0.002417s -> 1.192e-06s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00313s (of which 3.195e-05s partitioning, 0s I/O); computing times: 7.868e-06s in par. loops, 1.907e-06s sorting, 5.96e-06s analyzing) -Total merge + benchmarking process took 0.00313s, equivalent to 3282.2/5.3 new/old ops (0.006211s for 2 clones -- as 6512.8/10.5 ops, or 3256.4/5.2 ops per clone), SPEEDUP of 623.000x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 623.000x (0.0005941s -> 9.537e-07s), will amortize in 5.3 ops by saving 0.0005932s per op. -In 1 tuning rounds (tot. 0.009s, 0.0062s for constructor, 2 clones) obtained a SPEEDUP of 62200.0% (623x) (from 0.6463 to 402.7 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.009005s (of which 2.503e-05s partitioning, 0s I/O); computing times: 7.153e-06s in par. loops, 2.146e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.009005s, equivalent to 7553.8/3.7 new/old ops (0.01888s for 2 clones -- as 15841.8/7.8 ops, or 7920.9/3.9 ops per clone), SPEEDUP of 2027.600x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2027.600x (0.002417s -> 1.192e-06s), will amortize in 3.7 ops by saving 0.002416s per op. +In 1 tuning rounds (tot. 0.03s, 0.019s for constructor, 2 clones) obtained a SPEEDUP of 202660.0% (2028x) (from 0.1589 to 322.1 Mflops). #pr: updating sample at index 13 (5^th of 16), 0^th touch for (0,0,0,0,1,2,0). -First run of RSB Autotuner took 0.00906801 s (5.941e-04 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.030489 s (2.417e-03 s -> 1.192e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0640042 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.180747 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002348 0.002119 0.004467 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004467 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002348 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002119 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.006953 0.008264 0.015217 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.015217 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.006953 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.008264 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004467 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.015217 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 @@ -5762,59 +5799,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[4] SPMV[4] SPMV[4] -%operation:A.mtx 0.00653005 1e+09 1e+09 +%operation:A.mtx 0.0223269 1e+09 1e+09 %constructor:matrix SORT[4] SCAN[4] SHUFFLE[4] INSERT[4] -%constructor:A.mtx 0 0.00234818 0 0.00211906 +%constructor:A.mtx 0 0.006953 0 0.00826406 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 6.724s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.473s/0.000s . +# so far, program took 7.841s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.221s/0.000s . getrusage() stats: -ru_maxrss: 7 (maximum resident set size -- MB) -ru_stime : 0.06389s (system CPU time used) -ru_utime : 7.746s (user CPU time used) +ru_maxrss: 5 (maximum resident set size -- MB) +ru_stime : 0.1045s (system CPU time used) +ru_utime : 7.711s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was C). # Cache block size total 524288 bytes, per-thread 131072 bytes -# so far, program took 6.724s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.473s/0.000s . +# so far, program took 7.841s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.221s/0.000s . # Reusing type converted (C->Z) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 4 threads -# Constructed matrix (took 0.007s): (3 x 3)[0x19d1570]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.023s): (3 x 3)[0x19d4ff0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.003691s; avg 0.00123s ( +/- 56.01/ 28.24 %); best 0.0005412s; worst 0.001578s; std dev. 0.0004873 (taking best). -Reference operation time is 0.00054121 s (0.1774 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0005412 Mflops: 0.177) -Merge (3 -> 1 leaves) took w.c.t. of 2.289e-05s, ~7.868e-06s of computing time (of which 1.907e-06s sorting, 5.007e-06s analysis) -3 iterations (4 th.) took 2.503e-05s; avg 8.345e-06s ( +/- 88.57/162.86 %); best 9.537e-07s; worst 2.193e-05s; std dev. 9.622e-06 (taking best). -Reference operation time is 9.53674e-07 s (100.7 Mflops) with 4 threads. -After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 567.500x: 0.0005412s -> 9.537e-07s, so taking this instance. +3 iterations (4 th.) took 0.009539s; avg 0.00318s ( +/- 27.41/ 51.74 %); best 0.002308s; worst 0.004825s; std dev. 0.001164 (taking best). +Reference operation time is 0.00230813 s (0.04159 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002308 Mflops: 0.042) +Merge (3 -> 1 leaves) took w.c.t. of 2.098e-05s, ~7.868e-06s of computing time (of which 9.537e-07s sorting, 4.053e-06s analysis) +3 iterations (4 th.) took 2.503e-05s; avg 8.345e-06s ( +/- 98.92/177.14 %); best 9.01e-08s; worst 2.313e-05s; std dev. 1.048e-05 (taking best). +Reference operation time is 9.00984e-08 s (1066 Mflops) with 4 threads. +After merge step 1: tpop: 9.01e-08 s ~Mflops: 1065.502 nsubm:1 otn:4 +Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 25617.888x: 0.002308s -> 9.01e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003089s (of which 2.909e-05s partitioning, 0s I/O); computing times: 7.868e-06s in par. loops, 1.907e-06s sorting, 5.007e-06s analyzing) -Total merge + benchmarking process took 0.003089s, equivalent to 3239.0/5.7 new/old ops (0.006616s for 2 clones -- as 6937.5/12.2 ops, or 3468.8/6.1 ops per clone), SPEEDUP of 567.500x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 567.500x (0.0005412s -> 9.537e-07s), will amortize in 5.7 ops by saving 0.0005403s per op. -In 1 tuning rounds (tot. 0.01s, 0.0066s for constructor, 2 clones) obtained a SPEEDUP of 56650.0% (567.5x) (from 0.1774 to 100.7 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.011s (of which 2.599e-05s partitioning, 0s I/O); computing times: 7.868e-06s in par. loops, 9.537e-07s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.011s, equivalent to 122122.3/4.8 new/old ops (0.02207s for 2 clones -- as 244921.9/9.6 ops, or 122461.0/4.8 ops per clone), SPEEDUP of 25617.888x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 25617.888x (0.002308s -> 9.01e-08s), will amortize in 4.8 ops by saving 0.002308s per op. +In 1 tuning rounds (tot. 0.032s, 0.022s for constructor, 2 clones) obtained a SPEEDUP of 2561688.8% (2.562e+04x) (from 0.04159 to 1066 Mflops). #pr: updating sample at index 7 (6^th of 16), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.0104759 s (5.412e-04 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0317609 s (2.308e-03 s -> 9.010e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.053458 s and estimated a speedup of 1.000000 x (1.001e-07 s -> 1.001e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.180491 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002285 0.002211 0.004496 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004496 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002285 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002211 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.010002 0.006759 0.016761 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.016761 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.010002 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.006759 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004496 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.016761 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 @@ -5829,56 +5866,56 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[4] SPMV[4] SPMV[4] -%operation:A.mtx 0.00658083 1e+09 1e+09 +%operation:A.mtx 0.0232742 1e+09 1e+09 %constructor:matrix SORT[4] SCAN[4] SHUFFLE[4] INSERT[4] -%constructor:A.mtx 0 0.002285 0 0.00221109 +%constructor:A.mtx 0 0.0100019 0 0.00675917 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 4 threads -# Constructed matrix (took 0.006s): (3 x 3)[0x19d1570]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.023s): (3 x 3)[0x19d7d20]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.003383s; avg 0.001128s ( +/- 50.42/ 43.21 %); best 0.0005591s; worst 0.001615s; std dev. 0.0004349 (taking best). -Reference operation time is 0.000559092 s (0.6868 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0005591 Mflops: 0.687) -Merge (3 -> 1 leaves) took w.c.t. of 2.789e-05s, ~8.821e-06s of computing time (of which 9.537e-07s sorting, 5.96e-06s analysis) -3 iterations (4 th.) took 1.311e-05s; avg 4.371e-06s ( +/- 56.36/107.27 %); best 1.907e-06s; worst 9.06e-06s; std dev. 3.317e-06 (taking best). -Reference operation time is 1.90735e-06 s (201.3 Mflops) with 4 threads. -After merge step 1: tpop: 1.907e-06 s ~Mflops: 201.327 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 293.125x: 0.0005591s -> 1.907e-06s, so taking this instance. +3 iterations (4 th.) took 0.01003s; avg 0.003342s ( +/- 33.30/ 61.19 %); best 0.002229s; worst 0.005387s; std dev. 0.001448 (taking best). +Reference operation time is 0.00222898 s (0.1723 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.002229 Mflops: 0.172) +Merge (3 -> 1 leaves) took w.c.t. of 1.788e-05s, ~5.96e-06s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (4 th.) took 8.821e-06s; avg 2.94e-06s ( +/- 67.57/102.70 %); best 9.537e-07s; worst 5.96e-06s; std dev. 2.171e-06 (taking best). +Reference operation time is 9.53674e-07 s (402.7 Mflops) with 4 threads. +After merge step 1: tpop: 9.537e-07 s ~Mflops: 402.653 nsubm:1 otn:4 +Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 2337.250x: 0.002229s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003117s (of which 3.6e-05s partitioning, 0s I/O); computing times: 8.821e-06s in par. loops, 9.537e-07s sorting, 5.96e-06s analyzing) -Total merge + benchmarking process took 0.003117s, equivalent to 1634.2/5.6 new/old ops (0.00639s for 2 clones -- as 3350.2/11.4 ops, or 1675.1/5.7 ops per clone), SPEEDUP of 293.125x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 293.125x (0.0005591s -> 1.907e-06s), will amortize in 5.6 ops by saving 0.0005572s per op. -In 1 tuning rounds (tot. 0.0099s, 0.0064s for constructor, 2 clones) obtained a SPEEDUP of 29212.5% (293.1x) (from 0.6868 to 201.3 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01105s (of which 2.384e-05s partitioning, 0s I/O); computing times: 5.96e-06s in par. loops, 1.907e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.01105s, equivalent to 11586.8/5.0 new/old ops (0.02223s for 2 clones -- as 23309.0/10.0 ops, or 11654.5/5.0 ops per clone), SPEEDUP of 2337.250x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2337.250x (0.002229s -> 9.537e-07s), will amortize in 5.0 ops by saving 0.002228s per op. +In 1 tuning rounds (tot. 0.032s, 0.022s for constructor, 2 clones) obtained a SPEEDUP of 233625.0% (2337x) (from 0.1723 to 402.7 Mflops). #pr: updating sample at index 15 (7^th of 16), 0^th touch for (0,0,0,0,1,3,0). -First run of RSB Autotuner took 0.00995207 s (5.591e-04 s -> 1.907e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0323942 s (2.229e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0542798 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.181846 s and estimated a speedup of 1.000000 x (9.537e-07 s -> 9.537e-07 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002143 0.002125 0.004268 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004268 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002143 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002125 -%:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004268 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000001 0.008178 0.007100 0.015278 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.015279 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.008178 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.007100 +%:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000001 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 1.000 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.015278 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.00 %:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 1.00 %:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 1.00 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -5887,64 +5924,64 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[4] SPMV[4] SPMV[4] -%operation:A.mtx 0.00637102 1e+09 1e+09 +%operation:A.mtx 0.0225701 1e+09 1e+09 %constructor:matrix SORT[4] SCAN[4] SHUFFLE[4] INSERT[4] -%constructor:A.mtx 0 0.00214314 0 0.00212502 +%constructor:A.mtx 1.19209e-06 0.008178 0 0.00709987 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 6.886s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.601s/0.000s . +# so far, program took 8.369s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.648s/0.000s . getrusage() stats: -ru_maxrss: 7 (maximum resident set size -- MB) -ru_stime : 0.08393s (system CPU time used) -ru_utime : 8.191s (user CPU time used) +ru_maxrss: 5 (maximum resident set size -- MB) +ru_stime : 0.1208s (system CPU time used) +ru_utime : 8.211s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to type D: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 1.067e-03 0.000e+00 9.537e-07 0.000e+00 1.013e-02 1.55e-01 5.17e+00 1 2.40e-05 -pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 100.66 1.024e-03 0.000e+00 9.537e-07 0.000e+00 9.531e-03 3.82e-01 2.79e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 2.301e-03 0.000e+00 9.537e-07 0.000e+00 3.152e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 80.53 2.178e-03 0.000e+00 1.192e-06 0.000e+00 3.504e-02 3.05e-01 2.79e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 109512.5 % faster, avg. sp. ratio 1096.125x, max sp. ratio 1118.750x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10308.5/9994.0/10623.0/20617.0 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.4/ 9.3/ 9.5/ 18.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.4, min. 9.3, max. 9.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 211887.5 % faster, avg. sp. ratio 2119.875x, max sp. ratio 2412.750x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 31223.4/29397.8/33049.0/62446.8 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.9/ 13.7/ 16.1/ 29.8 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.9, min. 13.7, max. 16.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.206/ 0.130/ 0.281,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.537/ 0.155/ 0.382,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.177/ 0.130/ 0.225,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.461/ 0.155/ 0.305,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 3.979/ 2.792/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 6.291e+01, min 2.517e+01, max 1.007e+02 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.813e-02, min 2.249e-02, max 9.377e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 1.907e-06s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.045e-03s, min 1.024e-03s, max 1.067e-03s, tot 2.091e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.070e+01 4.474e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.07 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.07 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 5.285e+01, min 2.517e+01, max 8.053e+01 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.725e-02, min 1.043e-02, max 4.408e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 1.073e-06s, min 9.537e-07s, max 1.192e-06s, tot 2.146e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.239e-03s, min 2.178e-03s, max 2.301e-03s, tot 4.479e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.618e+01 4.526e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.200e+00 x, min 3.200e+00 x, max 3.200e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type S: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 5.460e-04 0.000e+00 9.537e-07 0.000e+00 1.973e-02 9.23e-02 3.17e+00 1 2.40e-05 -pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 1.033e-03 0.000e+00 9.537e-07 0.000e+00 1.480e-02 2.06e-01 1.54e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 2.263e-03 0.000e+00 9.537e-07 0.000e+00 3.052e-02 9.23e-02 3.17e+00 1 2.40e-05 +pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 2.364e-03 0.000e+00 9.537e-07 0.000e+00 3.292e-02 2.06e-01 1.54e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 82675.0 % faster, avg. sp. ratio 827.750x, max sp. ratio 1083.000x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 18101.6/15520.0/20683.2/36203.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 25.2/ 14.3/ 36.1/ 50.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 25.3, min. 14.3, max. 36.2 ops) +#pr: (in succ. cases rsb autotuning gave avg. 242500.0 % faster, avg. sp. ratio 2426.000x, max sp. ratio 2479.000x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 33259.8/32004.8/34514.8/66519.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.7/ 13.5/ 13.9/ 27.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.7, min. 13.5, max. 13.9 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 8/ 8/ 8) @@ -5957,263 +5994,263 @@ #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) #pr: best tun. rsb canon. mflops were: on avg. 6.291e+01, min 2.517e+01, max 1.007e+02 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 6.845e-02, min 4.396e-02, max 9.295e-02 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.561e-02, min 1.061e-02, max 4.061e-02 (2 samples) #pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 1.907e-06s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.894e-04s, min 5.460e-04s, max 1.033e-03s, tot 1.579e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 3.749e+01 7.300e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 +#pr: ref. unt. rsb operation time was: on avg. 2.314e-03s, min 2.263e-03s, max 2.364e-03s, tot 4.627e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 3.792e+01 7.384e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type C: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 1.100e-03 0.000e+00 9.537e-07 0.000e+00 2.258e-02 1.55e-01 1.29e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 402.65 5.941e-04 0.000e+00 9.537e-07 0.000e+00 9.068e-03 3.82e-01 6.98e-01 1 3.84e-04 +pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 2.273e-03 0.000e+00 9.537e-07 0.000e+00 3.245e-02 1.55e-01 1.29e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 322.12 2.417e-03 0.000e+00 1.192e-06 0.000e+00 3.049e-02 3.05e-01 6.98e-01 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 88725.0 % faster, avg. sp. ratio 888.250x, max sp. ratio 1153.500x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 16593.8/9508.5/23679.0/33187.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 17.9/ 15.3/ 20.5/ 35.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 17.9, min. 15.3, max. 20.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 220442.5 % faster, avg. sp. ratio 2205.425x, max sp. ratio 2383.250x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 29802.2/25576.0/34028.5/59604.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.4/ 12.6/ 14.3/ 26.9 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.5, min. 12.6, max. 14.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.206/ 0.130/ 0.281,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.537/ 0.155/ 0.382,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.177/ 0.130/ 0.225,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.461/ 0.155/ 0.305,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 0.995/ 0.698/ 1.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.517e+02, min 1.007e+02, max 4.027e+02 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.668e-01, min 8.727e-02, max 6.463e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 1.907e-06s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.471e-04s, min 5.941e-04s, max 1.100e-03s, tot 1.694e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.070e+01 4.474e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.114e+02, min 1.007e+02, max 3.221e+02 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.006e-01, min 4.224e-02, max 1.589e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 1.073e-06s, min 9.537e-07s, max 1.192e-06s, tot 2.146e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.345e-03s, min 2.273e-03s, max 2.417e-03s, tot 4.690e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.618e+01 4.526e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.200e+00 x, min 3.200e+00 x, max 3.200e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type Z: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 100.66 5.412e-04 0.000e+00 9.537e-07 0.000e+00 1.048e-02 2.81e-01 2.29e+00 1 9.60e-05 -pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 201.33 5.591e-04 0.000e+00 1.907e-06 0.000e+00 9.952e-03 3.67e-01 1.32e+00 1 3.84e-04 +pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 1065.50 2.308e-03 0.000e+00 9.010e-08 0.000e+00 3.176e-02 2.97e+00 2.29e+00 1 9.60e-05 +pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 402.65 2.229e-03 0.000e+00 9.537e-07 0.000e+00 3.239e-02 7.34e-01 1.32e+00 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 42931.2 % faster, avg. sp. ratio 430.312x, max sp. ratio 567.500x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 8101.2/5217.8/10984.8/16202.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 18.6/ 17.8/ 19.4/ 37.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 18.6, min. 17.9, max. 19.4 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1397656.9 % faster, avg. sp. ratio 13977.569x, max sp. ratio 25617.888x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 193240.8/33967.8/352513.9/386481.6 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.1/ 13.8/ 14.5/ 28.3 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.2, min. 13.8, max. 14.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.249/ 0.231/ 0.266,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.648/ 0.281/ 0.367,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.487/ 0.533/ 2.442,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.709/ 0.734/ 2.975,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.807/ 1.323/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.510e+02, min 1.007e+02, max 2.013e+02 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 4.321e-01, min 1.774e-01, max 6.868e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 1.431e-06s, min 9.537e-07s, max 1.907e-06s, tot 2.861e-06s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.502e-04s, min 5.412e-04s, max 5.591e-04s, tot 1.100e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.184e+01 2.522e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (1 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.06 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 7.341e+02, min 4.027e+02, max 1.066e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.069e-01, min 4.159e-02, max 1.723e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.219e-07s, min 9.010e-08s, max 9.537e-07s, tot 1.044e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.269e-03s, min 2.229e-03s, max 2.308e-03s, tot 4.537e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.410e+00 1.105e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.779e-01 x, min 3.779e-01 x, max 3.779e-01 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 1.067e-03 0.000e+00 9.537e-07 0.000e+00 1.013e-02 1.55e-01 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 5.460e-04 0.000e+00 9.537e-07 0.000e+00 1.973e-02 9.23e-02 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 1.100e-03 0.000e+00 9.537e-07 0.000e+00 2.258e-02 1.55e-01 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 100.66 5.412e-04 0.000e+00 9.537e-07 0.000e+00 1.048e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 2.301e-03 0.000e+00 9.537e-07 0.000e+00 3.152e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 2.263e-03 0.000e+00 9.537e-07 0.000e+00 3.052e-02 9.23e-02 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 2.273e-03 0.000e+00 9.537e-07 0.000e+00 3.245e-02 1.55e-01 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 1065.50 2.308e-03 0.000e+00 9.010e-08 0.000e+00 3.176e-02 2.97e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 85206.2 % faster, avg. sp. ratio 853.062x, max sp. ratio 1153.500x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 16492.5/10623.0/23679.0/65970.0 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21.4/ 9.5/ 36.1/ 85.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 21.4, min. 9.5, max. 36.2 ops) +#pr: (in succ. cases rsb autotuning gave avg. 819572.2 % faster, avg. sp. ratio 8196.722x, max sp. ratio 25617.888x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 112899.0/32004.8/352513.9/451596.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.8/ 13.5/ 14.3/ 55.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.8, min. 13.5, max. 14.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.143/ 0.080/ 0.231,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.684/ 0.092/ 0.281,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.695/ 0.080/ 2.442,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.377/ 0.092/ 2.975,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.06 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.06 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 6.291e+01, min 2.517e+01, max 1.007e+02 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 8.278e-02, min 2.249e-02, max 1.774e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 3.815e-06s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.135e-04s, min 5.412e-04s, max 1.100e-03s, tot 3.254e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.522e+01 7.300e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.13 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.13 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.041e+02, min 2.517e+01, max 1.066e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.622e-02, min 1.043e-02, max 4.224e-02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 7.378e-07s, min 9.010e-08s, max 9.537e-07s, tot 2.951e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.286e-03s, min 2.263e-03s, max 2.308e-03s, tot 9.145e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.410e+00 7.384e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 #pr: ======== Limiting to nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 100.66 1.024e-03 0.000e+00 9.537e-07 0.000e+00 9.531e-03 3.82e-01 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 1.033e-03 0.000e+00 9.537e-07 0.000e+00 1.480e-02 2.06e-01 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 402.65 5.941e-04 0.000e+00 9.537e-07 0.000e+00 9.068e-03 3.82e-01 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 201.33 5.591e-04 0.000e+00 1.907e-06 0.000e+00 9.952e-03 3.67e-01 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 80.53 2.178e-03 0.000e+00 1.192e-06 0.000e+00 3.504e-02 3.05e-01 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 2.364e-03 0.000e+00 9.537e-07 0.000e+00 3.292e-02 2.06e-01 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 322.12 2.417e-03 0.000e+00 1.192e-06 0.000e+00 3.049e-02 3.05e-01 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 402.65 2.229e-03 0.000e+00 9.537e-07 0.000e+00 3.239e-02 7.34e-01 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 76715.6 % faster, avg. sp. ratio 768.156x, max sp. ratio 1083.000x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10060.1/5217.8/15520.0/40240.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.2/ 9.3/ 17.8/ 56.7 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 14.2, min. 9.3, max. 17.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 216671.2 % faster, avg. sp. ratio 2167.713x, max sp. ratio 2479.000x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 30864.1/25576.0/34514.8/123456.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.3/ 12.6/ 16.1/ 57.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.3, min. 12.6, max. 16.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.246/ 0.155/ 0.281,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 1.336/ 0.206/ 0.382,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.284/ 0.155/ 0.533,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 1.550/ 0.206/ 0.734,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.04 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.04 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.013e+02, min 1.007e+02, max 4.027e+02 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.800e-01, min 9.295e-02, max 6.868e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 1.192e-06s, min 9.537e-07s, max 1.907e-06s, tot 4.768e-06s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.025e-04s, min 5.591e-04s, max 1.033e-03s, tot 3.210e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.070e+01 3.749e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.500e+00 x, min 2.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.13 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.13 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.265e+02, min 8.053e+01, max 4.027e+02 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.040e-01, min 4.061e-02, max 1.723e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 1.073e-06s, min 9.537e-07s, max 1.192e-06s, tot 4.292e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.297e-03s, min 2.178e-03s, max 2.417e-03s, tot 9.188e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.105e+01 3.792e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.694e+00 x, min 3.779e-01 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 1.067e-03 0.000e+00 9.537e-07 0.000e+00 1.013e-02 1.55e-01 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 5.460e-04 0.000e+00 9.537e-07 0.000e+00 1.973e-02 9.23e-02 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 1.100e-03 0.000e+00 9.537e-07 0.000e+00 2.258e-02 1.55e-01 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 100.66 5.412e-04 0.000e+00 9.537e-07 0.000e+00 1.048e-02 2.81e-01 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 100.66 1.024e-03 0.000e+00 9.537e-07 0.000e+00 9.531e-03 3.82e-01 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 1.033e-03 0.000e+00 9.537e-07 0.000e+00 1.480e-02 2.06e-01 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 402.65 5.941e-04 0.000e+00 9.537e-07 0.000e+00 9.068e-03 3.82e-01 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 201.33 5.591e-04 0.000e+00 1.907e-06 0.000e+00 9.952e-03 3.67e-01 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 2.301e-03 0.000e+00 9.537e-07 0.000e+00 3.152e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 2.263e-03 0.000e+00 9.537e-07 0.000e+00 3.052e-02 9.23e-02 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 2.273e-03 0.000e+00 9.537e-07 0.000e+00 3.245e-02 1.55e-01 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 1065.50 2.308e-03 0.000e+00 9.010e-08 0.000e+00 3.176e-02 2.97e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 80.53 2.178e-03 0.000e+00 1.192e-06 0.000e+00 3.504e-02 3.05e-01 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 2.364e-03 0.000e+00 9.537e-07 0.000e+00 3.292e-02 2.06e-01 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 322.12 2.417e-03 0.000e+00 1.192e-06 0.000e+00 3.049e-02 3.05e-01 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 402.65 2.229e-03 0.000e+00 9.537e-07 0.000e+00 3.239e-02 7.34e-01 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 80960.9 % faster, avg. sp. ratio 810.609x, max sp. ratio 1153.500x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13276.3/5217.8/23679.0/106210.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 17.8/ 9.3/ 36.1/142.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 17.8, min. 9.3, max. 36.2 ops) +#pr: (in succ. cases rsb autotuning gave avg. 518121.7 % faster, avg. sp. ratio 5182.217x, max sp. ratio 25617.888x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 71881.6/25576.0/352513.9/575052.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.0/ 12.6/ 16.1/112.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.1, min. 12.6, max. 16.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.194/ 0.080/ 0.281,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 2.020/ 0.092/ 0.382,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.490/ 0.080/ 2.442,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 4.927/ 0.092/ 2.975,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /8 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.11 s (8 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.11 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.321e+02, min 2.517e+01, max 4.027e+02 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.314e-01, min 2.249e-02, max 6.868e-01 (8 samples) -#pr: best tun. rsb operation time was: on avg. 1.073e-06s, min 9.537e-07s, max 1.907e-06s, tot 8.583e-06s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.080e-04s, min 5.412e-04s, max 1.100e-03s, tot 6.464e-03s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.070e+01 7.300e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.500e+00 x, min 2.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.26 s (8 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.26 s (8 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.653e+02, min 2.517e+01, max 1.066e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 6.509e-02, min 1.043e-02, max 1.723e-01 (8 samples) +#pr: best tun. rsb operation time was: on avg. 9.053e-07s, min 9.010e-08s, max 1.192e-06s, tot 7.243e-06s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.292e-03s, min 2.178e-03s, max 2.417e-03s, tot 1.833e-02s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.410e+00 7.384e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.694e+00 x, min 3.779e-01 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 1.067e-03 0.000e+00 9.537e-07 0.000e+00 1.013e-02 1.55e-01 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 5.460e-04 0.000e+00 9.537e-07 0.000e+00 1.973e-02 9.23e-02 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 1.100e-03 0.000e+00 9.537e-07 0.000e+00 2.258e-02 1.55e-01 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 100.66 5.412e-04 0.000e+00 9.537e-07 0.000e+00 1.048e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 2.301e-03 0.000e+00 9.537e-07 0.000e+00 3.152e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 2.263e-03 0.000e+00 9.537e-07 0.000e+00 3.052e-02 9.23e-02 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 2.273e-03 0.000e+00 9.537e-07 0.000e+00 3.245e-02 1.55e-01 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 1065.50 2.308e-03 0.000e+00 9.010e-08 0.000e+00 3.176e-02 2.97e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 85206.2 % faster, avg. sp. ratio 853.062x, max sp. ratio 1153.500x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 16492.5/10623.0/23679.0/65970.0 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21.4/ 9.5/ 36.1/ 85.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 21.4, min. 9.5, max. 36.2 ops) +#pr: (in succ. cases rsb autotuning gave avg. 819572.2 % faster, avg. sp. ratio 8196.722x, max sp. ratio 25617.888x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 112899.0/32004.8/352513.9/451596.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.8/ 13.5/ 14.3/ 55.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.8, min. 13.5, max. 14.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.143/ 0.080/ 0.231,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.684/ 0.092/ 0.281,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.695/ 0.080/ 2.442,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.377/ 0.092/ 2.975,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.06 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.06 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 6.291e+01, min 2.517e+01, max 1.007e+02 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 8.278e-02, min 2.249e-02, max 1.774e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 3.815e-06s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.135e-04s, min 5.412e-04s, max 1.100e-03s, tot 3.254e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.522e+01 7.300e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.13 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.03 s, tot 0.13 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.041e+02, min 2.517e+01, max 1.066e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.622e-02, min 1.043e-02, max 4.224e-02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 7.378e-07s, min 9.010e-08s, max 9.537e-07s, tot 2.951e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.286e-03s, min 2.263e-03s, max 2.308e-03s, tot 9.145e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.410e+00 7.384e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 #pr: ======== Limiting to both transA=N and nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 100.66 1.024e-03 0.000e+00 9.537e-07 0.000e+00 9.531e-03 3.82e-01 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 1.033e-03 0.000e+00 9.537e-07 0.000e+00 1.480e-02 2.06e-01 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 402.65 5.941e-04 0.000e+00 9.537e-07 0.000e+00 9.068e-03 3.82e-01 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 201.33 5.591e-04 0.000e+00 1.907e-06 0.000e+00 9.952e-03 3.67e-01 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 80.53 2.178e-03 0.000e+00 1.192e-06 0.000e+00 3.504e-02 3.05e-01 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 2.364e-03 0.000e+00 9.537e-07 0.000e+00 3.292e-02 2.06e-01 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 322.12 2.417e-03 0.000e+00 1.192e-06 0.000e+00 3.049e-02 3.05e-01 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 402.65 2.229e-03 0.000e+00 9.537e-07 0.000e+00 3.239e-02 7.34e-01 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 76715.6 % faster, avg. sp. ratio 768.156x, max sp. ratio 1083.000x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10060.1/5217.8/15520.0/40240.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.2/ 9.3/ 17.8/ 56.7 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 14.2, min. 9.3, max. 17.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 216671.2 % faster, avg. sp. ratio 2167.713x, max sp. ratio 2479.000x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 30864.1/25576.0/34514.8/123456.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.3/ 12.6/ 16.1/ 57.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.3, min. 12.6, max. 16.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.246/ 0.155/ 0.281,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 1.336/ 0.206/ 0.382,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.284/ 0.155/ 0.533,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 1.550/ 0.206/ 0.734,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.04 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.04 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.013e+02, min 1.007e+02, max 4.027e+02 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.800e-01, min 9.295e-02, max 6.868e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 1.192e-06s, min 9.537e-07s, max 1.907e-06s, tot 4.768e-06s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.025e-04s, min 5.591e-04s, max 1.033e-03s, tot 3.210e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.070e+01 3.749e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.500e+00 x, min 2.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.13 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.13 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.265e+02, min 8.053e+01, max 4.027e+02 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.040e-01, min 4.061e-02, max 1.723e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 1.073e-06s, min 9.537e-07s, max 1.192e-06s, tot 4.292e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.297e-03s, min 2.178e-03s, max 2.417e-03s, tot 9.188e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.105e+01 3.792e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.694e+00 x, min 3.779e-01 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 8) matched the dump criteria -- skipping dump round. #pr: ======== Limiting to both transA=T and nrhs=1: @@ -6223,68 +6260,68 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 1.067e-03 0.000e+00 9.537e-07 0.000e+00 1.013e-02 1.55e-01 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 5.460e-04 0.000e+00 9.537e-07 0.000e+00 1.973e-02 9.23e-02 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 1.100e-03 0.000e+00 9.537e-07 0.000e+00 2.258e-02 1.55e-01 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 100.66 5.412e-04 0.000e+00 9.537e-07 0.000e+00 1.048e-02 2.81e-01 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 100.66 1.024e-03 0.000e+00 9.537e-07 0.000e+00 9.531e-03 3.82e-01 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 1.033e-03 0.000e+00 9.537e-07 0.000e+00 1.480e-02 2.06e-01 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 402.65 5.941e-04 0.000e+00 9.537e-07 0.000e+00 9.068e-03 3.82e-01 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 201.33 5.591e-04 0.000e+00 1.907e-06 0.000e+00 9.952e-03 3.67e-01 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 4 4 0 4.0000 4.6667 3 1 25.17 2.301e-03 0.000e+00 9.537e-07 0.000e+00 3.152e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 4 4 0 4.0000 4.6667 3 1 25.17 2.263e-03 0.000e+00 9.537e-07 0.000e+00 3.052e-02 9.23e-02 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 4 4 0 4.0000 4.6667 3 1 100.66 2.273e-03 0.000e+00 9.537e-07 0.000e+00 3.245e-02 1.55e-01 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 4 4 0 4.0000 4.6667 3 1 1065.50 2.308e-03 0.000e+00 9.010e-08 0.000e+00 3.176e-02 2.97e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 4 4 0 4.0000 4.6667 3 1 80.53 2.178e-03 0.000e+00 1.192e-06 0.000e+00 3.504e-02 3.05e-01 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 4 4 0 4.0000 4.6667 3 1 100.66 2.364e-03 0.000e+00 9.537e-07 0.000e+00 3.292e-02 2.06e-01 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 4 4 0 4.0000 4.6667 3 1 322.12 2.417e-03 0.000e+00 1.192e-06 0.000e+00 3.049e-02 3.05e-01 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 4 4 0 4.0000 4.6667 3 1 402.65 2.229e-03 0.000e+00 9.537e-07 0.000e+00 3.239e-02 7.34e-01 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 80960.9 % faster, avg. sp. ratio 810.609x, max sp. ratio 1153.500x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13276.3/5217.8/23679.0/106210.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 17.8/ 9.3/ 36.1/142.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 17.8, min. 9.3, max. 36.2 ops) +#pr: (in succ. cases rsb autotuning gave avg. 518121.7 % faster, avg. sp. ratio 5182.217x, max sp. ratio 25617.888x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 71881.6/25576.0/352513.9/575052.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.0/ 12.6/ 16.1/112.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.1, min. 12.6, max. 16.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.194/ 0.080/ 0.281,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 2.020/ 0.092/ 0.382,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.490/ 0.080/ 2.442,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 4.927/ 0.092/ 2.975,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /8 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.11 s (8 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.11 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.321e+02, min 2.517e+01, max 4.027e+02 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.314e-01, min 2.249e-02, max 6.868e-01 (8 samples) -#pr: best tun. rsb operation time was: on avg. 1.073e-06s, min 9.537e-07s, max 1.907e-06s, tot 8.583e-06s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.080e-04s, min 5.412e-04s, max 1.100e-03s, tot 6.464e-03s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.070e+01 7.300e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.003e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.500e+00 x, min 2.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) -#pr: Record collection took 0.67 s. +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.26 s (8 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.26 s (8 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.653e+02, min 2.517e+01, max 1.066e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 6.509e-02, min 1.043e-02, max 1.723e-01 (8 samples) +#pr: best tun. rsb operation time was: on avg. 9.053e-07s, min 9.010e-08s, max 1.192e-06s, tot 7.243e-06s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.292e-03s, min 2.178e-03s, max 2.417e-03s, tot 1.833e-02s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.410e+00 7.384e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.966e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.694e+00 x, min 3.779e-01 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) +#pr: Record collection took 1.86 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 90 environment variables in 3809 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 90 environment variables in 3863 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1710619221_gcc-12.2.rpr -# Removing the temporary record file rsbench_pr__1710619221_gcc-12.2.rpr.tmp. -# terminating run at 1710619228 (after 6.9s of w.c.t.) -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash ./scripts/doc-tests.sh +#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1710622475_gcc-12.2.rpr +# Removing the temporary record file rsbench_pr__1710622475_gcc-12.2.rpr.tmp. +# terminating run at 1710622484 (after 8.4s of w.c.t.) +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh ./scripts/doc-tests.sh + set -o pipefail + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x -+ cat /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/autotune.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/io-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/power.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/snippets.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/transpose.c + grep '^.\{71,\}' ++ cat /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/autotune.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/io-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/power.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/snippets.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/transpose.c + true -+ cat /build/reproducible-path/librsb-1.3.0.2+dfsg/README + grep '^[^ ].\{80,\}' ++ cat /build/reproducible-path/librsb-1.3.0.2+dfsg/README + true -++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -h ++ wc -l -+ test 63 -ge 61 ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -h ++ test 63 -ge 61 ++ wc -c +++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -h + test 2014 -ge 1966 -++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h ++ wc -l -+ test 182 -ge 157 ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h ++ test 182 -ge 157 ++ wc -c +++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h + test 5369 -ge 4600 + exit 0 if ! ./librsb-config --help ; then echo "Problem executing the librsb-config script!"; false; fi; @@ -6319,7 +6356,7 @@ type char codes:D S C Z gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' if test /build/reproducible-path/librsb-1.3.0.2+dfsg != /build/reproducible-path/librsb-1.3.0.2+dfsg ; then cp /build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/vf.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/examples ; fi -( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) +( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) + which rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench + BRF=test.rpr @@ -6329,15 +6366,15 @@ Will invoke autotuning for ~10.000000 s x 1 rounds, specifying verbosity=0 and threads=0. (>0 means no structure tuning; 0 means only structure tuning, <0 means tuning of both with (negated) thread count suggestion). # Requested no transposition. # performance record file set to: test.rpr -# beginning run at 1710619228 +# beginning run at 1710622484 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench --lower 100 --as-symmetric --types : -n 1 --notranspose --compare-competitors --verbose --verbose --write-performance-record=test.rpr # compiled with: CC=gcc CFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -# average timer granularity: 9.79e-08 s +# average timer granularity: 8.86e-08 s # Will write a final performance record to file test.rpr and periodic checkpoints to test.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -6376,7 +6413,7 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: virt64c +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 2 (each --verbose occurrence counts +1) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 131072 bytes @@ -6396,29 +6433,29 @@ # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 6.085s +# Memory benchmark took 6.094s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 4 samples (1120 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 524288 bytes, per-thread 131072 bytes -# so far, program took 6.089s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 6.099s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.587e-03 s (100.00 %) - analyzed arrays in 2.020e-03 s (23.52 %) - cleaned-up arrays in 6.413e-05 s (0.75 %) - deduplicated arrays in 1.693e-05 s (0.20 %) - sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.332e-03 s (50.45 %) - memory allocations took 2.098e-05 s (0.24 %) - leafs setup took 9.060e-06 s (0.11 %) - halfword conversion took 2.119e-03 s (24.68 %) -Built (100 x 100)[0x1d7f8a0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.009s): (100 x 100)[0x1d7f8a0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + converted COO to RSB in 2.771e-02 s (100.00 %) + analyzed arrays in 6.391e-03 s (23.06 %) + cleaned-up arrays in 6.104e-05 s (0.22 %) + deduplicated arrays in 1.693e-05 s (0.06 %) + sorted arrays in 1.192e-06 s (0.00 %) + shuffled partitions in 1.353e-02 s (48.83 %) + memory allocations took 2.789e-05 s (0.10 %) + leafs setup took 7.868e-06 s (0.03 %) + halfword conversion took 7.667e-03 s (27.67 %) +Built (100 x 100)[0x17e4870]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.028s): (100 x 100)[0x17e4870]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -6469,10 +6506,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003181s; avg 0.00106s ( +/- 9.36/ 12.99 %); best 0.0009611s; worst 0.001198s; std dev. 0.0001005 (taking best). -Reference operation time is 0.000961065 s (21.02 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0009611 Mflops: 21.018) -Merge (3 -> 1 leaves) took w.c.t. of 0.0001822s, ~0.0001559s of computing time (of which 6.294e-05s sorting, 8.106e-06s analysis) +3 iterations (1 th.) took 0.00977s; avg 0.003257s ( +/- 26.31/ 32.87 %); best 0.0024s; worst 0.004327s; std dev. 0.0008011 (taking best). +Reference operation time is 0.00239992 s (8.417 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0024 Mflops: 8.417) +Merge (3 -> 1 leaves) took w.c.t. of 0.00014s, ~0.000119s of computing time (of which 5.698e-05s sorting, 7.153e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6503,8 +6540,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.486e-05s; avg 2.495e-05s ( +/- 12.10/ 15.61 %); best 2.193e-05s; worst 2.885e-05s; std dev. 2.89e-06 (taking best). -Reference operation time is 2.19345e-05 s (920.9 Mflops) with 1 threads. +3 iterations (1 th.) took 7.606e-05s; avg 2.535e-05s ( +/- 9.72/ 18.50 %); best 2.289e-05s; worst 3.004e-05s; std dev. 3.317e-06 (taking best). +Reference operation time is 2.28882e-05 s (882.6 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6520,16 +6557,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 2.193e-05 s ~Mflops: 920.923 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 43.815x: 0.0009611s -> 2.193e-05s, so taking this instance. +After merge step 1: tpop: 2.289e-05 s ~Mflops: 882.551 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 104.854x: 0.0024s -> 2.289e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01559s (of which 0.000195s partitioning, 0.0122s I/O); computing times: 0.0001559s in par. loops, 6.294e-05s sorting, 8.106e-06s analyzing) -Total merge + benchmarking process took 0.01559s, equivalent to 710.6/16.2 new/old ops (0.00593s for 2 clones -- as 270.4/6.2 ops, or 135.2/3.1 ops per clone), SPEEDUP of 43.815x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 43.815x (0.0009611s -> 2.193e-05s), will amortize in 16.6 ops by saving 0.0009391s per op. -In 1 tuning rounds (tot. 0.022s, 0.0059s for constructor, 2 clones) obtained a SPEEDUP of 4281.5% (43.82x) (from 21.02 to 920.9 Mflops). Employed 0.012s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.03963s (of which 0.0001481s partitioning, 0.02861s I/O); computing times: 0.000119s in par. loops, 5.698e-05s sorting, 7.153e-06s analyzing) +Total merge + benchmarking process took 0.03963s, equivalent to 1731.5/16.5 new/old ops (0.01762s for 2 clones -- as 769.9/7.3 ops, or 384.9/3.7 ops per clone), SPEEDUP of 104.854x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 104.854x (0.0024s -> 2.289e-05s), will amortize in 16.7 ops by saving 0.002377s per op. +In 1 tuning rounds (tot. 0.058s, 0.018s for constructor, 2 clones) obtained a SPEEDUP of 10385.4% (104.9x) (from 8.417 to 882.6 Mflops). Employed 0.026s for I/O of matrix plots. #pr: updating sample at index 1 (0^th of 4), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.0339861 s (9.611e-04 s -> 2.193e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0844982 s (2.400e-03 s -> 2.289e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6595,20 +6632,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.915e-05s; avg 2.638e-05s ( +/- 13.25/ 25.60 %); best 2.289e-05s; worst 3.314e-05s; std dev. 4.778e-06 (taking best). +3 iterations (1 th.) took 8.011e-05s; avg 2.67e-05s ( +/- 14.29/ 24.11 %); best 2.289e-05s; worst 3.314e-05s; std dev. 4.578e-06 (taking best). Reference operation time is 2.28882e-05 s (882.6 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.395e-03 s (100.00 %) - analyzed arrays in 1.117e-03 s (32.90 %) - cleaned-up arrays in 5.889e-05 s (1.73 %) - deduplicated arrays in 1.383e-05 s (0.41 %) - sorted arrays in 1.192e-06 s (0.04 %) - shuffled partitions in 2.174e-03 s (64.03 %) - memory allocations took 9.298e-06 s (0.27 %) - leafs setup took 3.099e-06 s (0.09 %) - halfword conversion took 1.597e-05 s (0.47 %) -Built (100 x 100)[0x1d81a10]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + converted COO to RSB in 9.970e-03 s (100.00 %) + analyzed arrays in 3.360e-03 s (33.70 %) + cleaned-up arrays in 5.889e-05 s (0.59 %) + deduplicated arrays in 1.502e-05 s (0.15 %) + sorted arrays in 0.000e+00 s (0.00 %) + shuffled partitions in 6.506e-03 s (65.26 %) + memory allocations took 9.298e-06 s (0.09 %) + leafs setup took 1.907e-06 s (0.02 %) + halfword conversion took 1.693e-05 s (0.17 %) +Built (100 x 100)[0x17e69c0]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 4). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6642,16 +6679,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.869e-03 s (100.00 %) - analyzed arrays in 2.885e-03 s (32.53 %) - cleaned-up arrays in 5.889e-05 s (0.66 %) - deduplicated arrays in 1.502e-05 s (0.17 %) + converted COO to RSB in 3.009e-02 s (100.00 %) + analyzed arrays in 9.246e-03 s (30.73 %) + cleaned-up arrays in 5.817e-05 s (0.19 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.748e-03 s (42.26 %) - memory allocations took 1.097e-05 s (0.12 %) - leafs setup took 2.861e-06 s (0.03 %) - halfword conversion took 2.146e-03 s (24.20 %) -Built (100 x 100)[0x1d80080]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + shuffled partitions in 1.416e-02 s (47.07 %) + memory allocations took 8.583e-06 s (0.03 %) + leafs setup took 3.099e-06 s (0.01 %) + halfword conversion took 6.595e-03 s (21.92 %) +Built (100 x 100)[0x17e4870]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6697,9 +6734,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0028s; avg 0.0009334s ( +/- 35.50/ 22.68 %); best 0.000602s; worst 0.001145s; std dev. 0.0002373 (taking best). -Reference operation time is 0.000602007 s (33.55 Mflops) with 1 threads. -Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000602007 s/0 threads (speedup 0.0380198 x), same?n. +3 iterations (1 th.) took 0.01057s; avg 0.003525s ( +/- 29.61/ 27.44 %); best 0.002481s; worst 0.004492s; std dev. 0.0008227 (taking best). +Reference operation time is 0.00248098 s (8.142 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.00248098 s/0 threads (speedup 0.00922545 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6733,16 +6770,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.096e-03 s (100.00 %) - analyzed arrays in 2.901e-03 s (31.89 %) - cleaned-up arrays in 5.913e-05 s (0.65 %) - deduplicated arrays in 1.502e-05 s (0.17 %) + converted COO to RSB in 3.078e-02 s (100.00 %) + analyzed arrays in 1.161e-02 s (37.73 %) + cleaned-up arrays in 7.701e-05 s (0.25 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.808e-03 s (41.87 %) - memory allocations took 1.264e-05 s (0.14 %) - leafs setup took 5.007e-06 s (0.06 %) - halfword conversion took 2.294e-03 s (25.22 %) -Built (100 x 100)[0x1d70b60]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.196e-02 s (38.86 %) + memory allocations took 1.216e-05 s (0.04 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 7.098e-03 s (23.06 %) +Built (100 x 100)[0x17e5600]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6788,9 +6825,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002735s; avg 0.0009116s ( +/- 22.46/ 17.48 %); best 0.0007069s; worst 0.001071s; std dev. 0.0001521 (taking best). -Reference operation time is 0.000706911 s (28.58 Mflops) with 1 threads. -Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000706911 s/0 threads (speedup 0.0323777 x), same?n. +3 iterations (1 th.) took 0.01057s; avg 0.003523s ( +/- 29.63/ 30.03 %); best 0.002479s; worst 0.004581s; std dev. 0.0008582 (taking best). +Reference operation time is 0.00247908 s (8.148 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.00247908 s/0 threads (speedup 0.00923254 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6824,16 +6861,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.045e-03 s (100.00 %) - analyzed arrays in 2.445e-03 s (27.03 %) - cleaned-up arrays in 5.889e-05 s (0.65 %) - deduplicated arrays in 1.502e-05 s (0.17 %) + converted COO to RSB in 2.828e-02 s (100.00 %) + analyzed arrays in 7.492e-03 s (26.49 %) + cleaned-up arrays in 5.889e-05 s (0.21 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.393e-03 s (48.57 %) - memory allocations took 1.574e-05 s (0.17 %) - leafs setup took 5.960e-06 s (0.07 %) - halfword conversion took 2.110e-03 s (23.33 %) -Built (100 x 100)[0x1d70b60]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.398e-02 s (49.45 %) + memory allocations took 1.216e-05 s (0.04 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 6.713e-03 s (23.74 %) +Built (100 x 100)[0x17f7790]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6879,9 +6916,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002426s; avg 0.0008086s ( +/- 22.84/ 45.68 %); best 0.0006239s; worst 0.001178s; std dev. 0.0002612 (taking best). -Reference operation time is 0.000623941 s (32.37 Mflops) with 1 threads. -Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 1, 10 leaves, 2.206 bytes/nz, 0.000623941 s/0 threads (speedup 0.0366832 x), same?n. +3 iterations (1 th.) took 0.0117s; avg 0.003901s ( +/- 42.54/ 28.42 %); best 0.002242s; worst 0.00501s; std dev. 0.001195 (taking best). +Reference operation time is 0.00224185 s (9.01 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 1, 10 leaves, 2.206 bytes/nz, 0.00224185 s/0 threads (speedup 0.0102095 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6915,16 +6952,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.023e-03 s (100.00 %) - analyzed arrays in 2.387e-03 s (26.46 %) - cleaned-up arrays in 6.008e-05 s (0.67 %) - deduplicated arrays in 1.502e-05 s (0.17 %) + converted COO to RSB in 2.655e-02 s (100.00 %) + analyzed arrays in 7.543e-03 s (28.41 %) + cleaned-up arrays in 5.913e-05 s (0.22 %) + deduplicated arrays in 1.478e-05 s (0.06 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.383e-03 s (48.58 %) - memory allocations took 1.574e-05 s (0.17 %) - leafs setup took 5.007e-06 s (0.06 %) - halfword conversion took 2.156e-03 s (23.89 %) -Built (100 x 100)[0x1d70b60]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.212e-02 s (45.64 %) + memory allocations took 1.192e-05 s (0.04 %) + leafs setup took 3.815e-06 s (0.01 %) + halfword conversion took 6.798e-03 s (25.61 %) +Built (100 x 100)[0x17f7790]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6970,9 +7007,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003077s; avg 0.001026s ( +/- 15.57/ 12.72 %); best 0.0008659s; worst 0.001156s; std dev. 0.0001203 (taking best). -Reference operation time is 0.000865936 s (23.33 Mflops) with 1 threads. -Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 2, 10 leaves, 2.206 bytes/nz, 0.000865936 s/0 threads (speedup 0.0264317 x), same?n. +3 iterations (1 th.) took 0.0109s; avg 0.003632s ( +/- 33.68/ 26.42 %); best 0.002409s; worst 0.004592s; std dev. 0.0009105 (taking best). +Reference operation time is 0.00240898 s (8.385 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 2, 10 leaves, 2.206 bytes/nz, 0.00240898 s/0 threads (speedup 0.00950119 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7006,16 +7043,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.178e-03 s (100.00 %) - analyzed arrays in 2.395e-03 s (26.10 %) - cleaned-up arrays in 5.889e-05 s (0.64 %) - deduplicated arrays in 1.502e-05 s (0.16 %) + converted COO to RSB in 2.879e-02 s (100.00 %) + analyzed arrays in 8.086e-03 s (28.08 %) + cleaned-up arrays in 5.794e-05 s (0.20 %) + deduplicated arrays in 1.597e-05 s (0.06 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.477e-03 s (48.78 %) - memory allocations took 1.788e-05 s (0.19 %) - leafs setup took 5.007e-06 s (0.05 %) - halfword conversion took 2.208e-03 s (24.06 %) -Built (100 x 100)[0x1db50b0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.347e-02 s (46.79 %) + memory allocations took 1.431e-05 s (0.05 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 7.138e-03 s (24.79 %) +Built (100 x 100)[0x181edc0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7061,9 +7098,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002865s; avg 0.0009549s ( +/- 24.83/ 17.82 %); best 0.0007179s; worst 0.001125s; std dev. 0.0001728 (taking best). -Reference operation time is 0.000717878 s (28.14 Mflops) with 1 threads. -Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 4, 10 leaves, 2.206 bytes/nz, 0.000717878 s/0 threads (speedup 0.0318831 x), same?n. +3 iterations (1 th.) took 0.01006s; avg 0.003353s ( +/- 25.84/ 43.59 %); best 0.002487s; worst 0.004815s; std dev. 0.00104 (taking best). +Reference operation time is 0.00248694 s (8.122 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 4, 10 leaves, 2.206 bytes/nz, 0.00248694 s/0 threads (speedup 0.00920334 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz Best sparse multiply performance with subdivision multiplier of 1: 882.551 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing @@ -7081,29 +7118,29 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.065563 s (eq. to 3e+03/ 3e+03 old/new op.times), gained local/global speedup 1 x (2.28882e-05 : 2.28882e-05) / 1 x (2.28882e-05 : 2.28882e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.212016 s (eq. to 9e+03/ 9e+03 old/new op.times), gained local/global speedup 1 x (2.28882e-05 : 2.28882e-05) / 1 x (2.28882e-05 : 2.28882e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.066s, 0.051s for constructor, 0 clones) obtained NO speedup (best stays 882.6 Mflops). -Second run of RSB Autotuner took 0.0656691 s and estimated a speedup of 1.000000 x (2.289e-05 s -> 2.289e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.21s, 0.16s for constructor, 0 clones) obtained NO speedup (best stays 882.6 Mflops). +Second run of RSB Autotuner took 0.21209 s and estimated a speedup of 1.000000 x (2.289e-05 s -> 2.289e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:100 #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.002020 0.004332 0.006352 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.006352 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002020 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004332 -%:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 -%:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.006352 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000001 0.006391 0.013532 0.019923 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.019924 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.006391 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.013532 +%:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000001 +%:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.000 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.019923 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:RSB_SUBDIVISION_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:RSB_SHUFFLE_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 -%:CONSTRUCTOR_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:lower-100x100-5050nz S N 1 100 100 5050 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:lower-100x100-5050nz S N 1 100 100 5050 10504 40400 20600 @@ -7112,34 +7149,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00858688 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.0277109 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00201988 0 0.00433207 -# so far, program took 6.207s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.100s/0.000s . +%constructor:lower-100x100-5050nz 1.19209e-06 0.00639105 0 0.0135319 +# so far, program took 6.452s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.297s/0.000s . getrusage() stats: ru_maxrss: 5 (maximum resident set size -- MB) -ru_stime : 0.04412s (system CPU time used) -ru_utime : 6.377s (user CPU time used) +ru_stime : 0.05997s (system CPU time used) +ru_utime : 6.393s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 6.207s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.100s/0.000s . +# so far, program took 6.452s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.297s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 7.578e-03 s (100.00 %) - analyzed arrays in 1.148e-03 s (15.15 %) - cleaned-up arrays in 6.199e-05 s (0.82 %) - deduplicated arrays in 1.502e-05 s (0.20 %) + converted COO to RSB in 2.635e-02 s (100.00 %) + analyzed arrays in 3.487e-03 s (13.24 %) + cleaned-up arrays in 5.889e-05 s (0.22 %) + deduplicated arrays in 1.502e-05 s (0.06 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.281e-03 s (56.49 %) - memory allocations took 1.097e-05 s (0.14 %) - leafs setup took 5.007e-06 s (0.07 %) - halfword conversion took 2.054e-03 s (27.10 %) -Built (100 x 100)[0x1d71180]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.008s): (100 x 100)[0x1d71180]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 1.497e-02 s (56.81 %) + memory allocations took 1.097e-05 s (0.04 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 7.797e-03 s (29.60 %) +Built (100 x 100)[0x17f77c0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.026s): (100 x 100)[0x17f77c0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -7190,10 +7227,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003057s; avg 0.001019s ( +/- 4.52/ 3.74 %); best 0.000973s; worst 0.001057s; std dev. 3.481e-05 (taking best). -Reference operation time is 0.000972986 s (20.76 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.000973 Mflops: 20.761) -Merge (3 -> 1 leaves) took w.c.t. of 0.000129s, ~0.0001121s of computing time (of which 5.198e-05s sorting, 6.199e-06s analysis) +3 iterations (1 th.) took 0.009989s; avg 0.00333s ( +/- 29.48/ 42.59 %); best 0.002348s; worst 0.004748s; std dev. 0.001027 (taking best). +Reference operation time is 0.00234818 s (8.602 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.002348 Mflops: 8.602) +Merge (3 -> 1 leaves) took w.c.t. of 0.000124s, ~0.000108s of computing time (of which 5.007e-05s sorting, 5.007e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7224,7 +7261,7 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.081e-05s; avg 2.36e-05s ( +/- 7.07/ 10.10 %); best 2.193e-05s; worst 2.599e-05s; std dev. 1.73e-06 (taking best). +3 iterations (1 th.) took 6.89e-05s; avg 2.297e-05s ( +/- 4.50/ 9.00 %); best 2.193e-05s; worst 2.503e-05s; std dev. 1.461e-06 (taking best). Reference operation time is 2.19345e-05 s (920.9 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7242,15 +7279,15 @@ # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success After merge step 1: tpop: 2.193e-05 s ~Mflops: 920.923 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 44.359x: 0.000973s -> 2.193e-05s, so taking this instance. +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 107.054x: 0.002348s -> 2.193e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01493s (of which 0.000138s partitioning, 0.01174s I/O); computing times: 0.0001121s in par. loops, 5.198e-05s sorting, 6.199e-06s analyzing) -Total merge + benchmarking process took 0.01493s, equivalent to 680.4/15.3 new/old ops (0.005702s for 2 clones -- as 259.9/5.9 ops, or 130.0/2.9 ops per clone), SPEEDUP of 44.359x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 44.359x (0.000973s -> 2.193e-05s), will amortize in 15.7 ops by saving 0.0009511s per op. -In 1 tuning rounds (tot. 0.021s, 0.0057s for constructor, 2 clones) obtained a SPEEDUP of 4335.9% (44.36x) (from 20.76 to 920.9 Mflops). Employed 0.012s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.0374s (of which 0.0001309s partitioning, 0.02749s I/O); computing times: 0.000108s in par. loops, 5.007e-05s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.0374s, equivalent to 1705.0/15.9 new/old ops (0.01822s for 2 clones -- as 830.6/7.8 ops, or 415.3/3.9 ops per clone), SPEEDUP of 107.054x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 107.054x (0.002348s -> 2.193e-05s), will amortize in 16.1 ops by saving 0.002326s per op. +In 1 tuning rounds (tot. 0.056s, 0.018s for constructor, 2 clones) obtained a SPEEDUP of 10605.4% (107.1x) (from 8.602 to 920.9 Mflops). Employed 0.027s for I/O of matrix plots. #pr: updating sample at index 2 (1^th of 4), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.0331659 s (9.730e-04 s -> 2.193e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0830622 s (2.348e-03 s -> 2.193e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -7316,20 +7353,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.391e-05s; avg 2.464e-05s ( +/- 10.97/ 18.06 %); best 2.193e-05s; worst 2.909e-05s; std dev. 3.171e-06 (taking best). -Reference operation time is 2.19345e-05 s (920.9 Mflops) with 1 threads. +3 iterations (1 th.) took 8.011e-05s; avg 2.67e-05s ( +/- 14.29/ 27.68 %); best 2.289e-05s; worst 3.409e-05s; std dev. 5.227e-06 (taking best). +Reference operation time is 2.28882e-05 s (882.6 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.342e-03 s (100.00 %) - analyzed arrays in 1.106e-03 s (33.09 %) - cleaned-up arrays in 5.817e-05 s (1.74 %) - deduplicated arrays in 1.478e-05 s (0.44 %) + converted COO to RSB in 9.908e-03 s (100.00 %) + analyzed arrays in 3.374e-03 s (34.05 %) + cleaned-up arrays in 5.913e-05 s (0.60 %) + deduplicated arrays in 1.502e-05 s (0.15 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.135e-03 s (63.89 %) - memory allocations took 9.060e-06 s (0.27 %) - leafs setup took 2.861e-06 s (0.09 %) - halfword conversion took 1.311e-05 s (0.39 %) -Built (100 x 100)[0x1d80a20]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 6.432e-03 s (64.92 %) + memory allocations took 1.097e-05 s (0.11 %) + leafs setup took 1.907e-06 s (0.02 %) + halfword conversion took 1.407e-05 s (0.14 %) +Built (100 x 100)[0x17e7970]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 4). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7363,16 +7400,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.937e-03 s (100.00 %) - analyzed arrays in 2.878e-03 s (58.29 %) - cleaned-up arrays in 5.817e-05 s (1.18 %) - deduplicated arrays in 1.478e-05 s (0.30 %) + converted COO to RSB in 1.885e-02 s (100.00 %) + analyzed arrays in 8.112e-03 s (43.03 %) + cleaned-up arrays in 5.794e-05 s (0.31 %) + deduplicated arrays in 1.502e-05 s (0.08 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.949e-03 s (39.48 %) - memory allocations took 1.216e-05 s (0.25 %) - leafs setup took 4.053e-06 s (0.08 %) - halfword conversion took 2.003e-05 s (0.41 %) -Built (100 x 100)[0x1d72e80]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 1.064e-02 s (56.41 %) + memory allocations took 8.821e-06 s (0.05 %) + leafs setup took 2.861e-06 s (0.02 %) + halfword conversion took 2.098e-05 s (0.11 %) +Built (100 x 100)[0x17f94c0]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7418,10 +7455,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.486e-05s; avg 2.495e-05s ( +/- 12.10/ 16.56 %); best 2.193e-05s; worst 2.909e-05s; std dev. 3.024e-06 (taking best). +3 iterations (1 th.) took 7.176e-05s; avg 2.392e-05s ( +/- 8.31/ 16.61 %); best 2.193e-05s; worst 2.789e-05s; std dev. 2.81e-06 (taking best). Reference operation time is 2.19345e-05 s (920.9 Mflops) with 1 threads. -Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 2.19345e-05 s/0 threads (speedup 1 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 2.19345e-05 s/0 threads (speedup 1.04348 x), same?n. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7454,16 +7490,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.264e-03 s (100.00 %) - analyzed arrays in 2.217e-03 s (23.93 %) - cleaned-up arrays in 5.913e-05 s (0.64 %) - deduplicated arrays in 1.478e-05 s (0.16 %) + converted COO to RSB in 3.049e-02 s (100.00 %) + analyzed arrays in 8.694e-03 s (28.52 %) + cleaned-up arrays in 5.794e-05 s (0.19 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.893e-03 s (52.82 %) - memory allocations took 1.216e-05 s (0.13 %) - leafs setup took 3.815e-06 s (0.04 %) - halfword conversion took 2.064e-03 s (22.28 %) -Built (100 x 100)[0x1d734a0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 7, symflags:'LS' + shuffled partitions in 1.445e-02 s (47.41 %) + memory allocations took 1.097e-05 s (0.04 %) + leafs setup took 3.099e-06 s (0.01 %) + halfword conversion took 7.250e-03 s (23.78 %) +Built (100 x 100)[0x17f9ae0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7509,10 +7545,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002844s; avg 0.000948s ( +/- 34.18/ 24.57 %); best 0.0006239s; worst 0.001181s; std dev. 0.0002363 (taking best). -Reference operation time is 0.000623941 s (32.37 Mflops) with 1 threads. -Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 0.5, 7 leaves, 2.164 bytes/nz, 0.000623941 s/0 threads (speedup 0.0351548 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 10 subms, 7 lsubms, 2.1640 bpnz +3 iterations (1 th.) took 0.009114s; avg 0.003038s ( +/- 18.11/ 17.38 %); best 0.002488s; worst 0.003566s; std dev. 0.0004404 (taking best). +Reference operation time is 0.0024879 s (8.119 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/0 threads) with: subdivision 0.5, 6 leaves, 2.163 bytes/nz, 0.0024879 s/0 threads (speedup 0.00881648 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 8 subms, 6 lsubms, 2.1632 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7545,16 +7581,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.382e-03 s (100.00 %) - analyzed arrays in 2.217e-03 s (23.63 %) - cleaned-up arrays in 5.794e-05 s (0.62 %) - deduplicated arrays in 1.597e-05 s (0.17 %) + converted COO to RSB in 2.894e-02 s (100.00 %) + analyzed arrays in 7.517e-03 s (25.98 %) + cleaned-up arrays in 5.794e-05 s (0.20 %) + deduplicated arrays in 1.597e-05 s (0.06 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.445e-03 s (47.38 %) - memory allocations took 1.311e-05 s (0.14 %) - leafs setup took 5.007e-06 s (0.05 %) - halfword conversion took 2.627e-03 s (28.00 %) -Built (100 x 100)[0x1d734a0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.377e-02 s (47.59 %) + memory allocations took 1.025e-05 s (0.04 %) + leafs setup took 3.815e-06 s (0.01 %) + halfword conversion took 7.559e-03 s (26.12 %) +Built (100 x 100)[0x17f9ae0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7600,9 +7636,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002829s; avg 0.000943s ( +/- 36.92/ 22.27 %); best 0.0005949s; worst 0.001153s; std dev. 0.0002479 (taking best). -Reference operation time is 0.000594854 s (33.96 Mflops) with 1 threads. -Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 1, 10 leaves, 2.206 bytes/nz, 0.000594854 s/0 threads (speedup 0.0368737 x), same?n. +3 iterations (1 th.) took 0.01213s; avg 0.004044s ( +/- 37.49/ 21.43 %); best 0.002528s; worst 0.004911s; std dev. 0.001076 (taking best). +Reference operation time is 0.00252795 s (7.991 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/0 threads) with: subdivision 1, 10 leaves, 2.206 bytes/nz, 0.00252795 s/0 threads (speedup 0.00867679 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7636,16 +7672,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.400e-03 s (100.00 %) - analyzed arrays in 2.304e-03 s (24.51 %) - cleaned-up arrays in 5.794e-05 s (0.62 %) - deduplicated arrays in 1.502e-05 s (0.16 %) + converted COO to RSB in 3.251e-02 s (100.00 %) + analyzed arrays in 8.588e-03 s (26.42 %) + cleaned-up arrays in 5.794e-05 s (0.18 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.456e-03 s (47.40 %) - memory allocations took 1.407e-05 s (0.15 %) - leafs setup took 5.960e-06 s (0.06 %) - halfword conversion took 2.546e-03 s (27.09 %) -Built (100 x 100)[0x1d8cc20]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.451e-02 s (44.64 %) + memory allocations took 1.383e-05 s (0.04 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 9.315e-03 s (28.65 %) +Built (100 x 100)[0x17c1f50]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7691,9 +7727,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002862s; avg 0.000954s ( +/- 40.47/ 21.28 %); best 0.0005679s; worst 0.001157s; std dev. 0.0002731 (taking best). -Reference operation time is 0.000567913 s (35.57 Mflops) with 1 threads. -Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 2, 10 leaves, 2.206 bytes/nz, 0.000567913 s/0 threads (speedup 0.038623 x), same?n. +3 iterations (1 th.) took 0.009363s; avg 0.003121s ( +/- 26.66/ 27.36 %); best 0.002289s; worst 0.003975s; std dev. 0.0006884 (taking best). +Reference operation time is 0.00228906 s (8.825 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/0 threads) with: subdivision 2, 10 leaves, 2.206 bytes/nz, 0.00228906 s/0 threads (speedup 0.00958234 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7727,16 +7763,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.230e-03 s (100.00 %) - analyzed arrays in 2.913e-03 s (31.56 %) - cleaned-up arrays in 5.794e-05 s (0.63 %) - deduplicated arrays in 1.597e-05 s (0.17 %) + converted COO to RSB in 3.147e-02 s (100.00 %) + analyzed arrays in 9.901e-03 s (31.46 %) + cleaned-up arrays in 5.794e-05 s (0.18 %) + deduplicated arrays in 1.621e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.504e-03 s (48.80 %) - memory allocations took 1.621e-05 s (0.18 %) - leafs setup took 6.914e-06 s (0.07 %) - halfword conversion took 1.714e-03 s (18.57 %) -Built (100 x 100)[0x1db5080]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.362e-02 s (43.29 %) + memory allocations took 3.195e-05 s (0.10 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 7.832e-03 s (24.89 %) +Built (100 x 100)[0x1837860]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7782,11 +7818,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003257s; avg 0.001086s ( +/- 47.69/ 45.44 %); best 0.0005679s; worst 0.001579s; std dev. 0.0004132 (taking best). -Reference operation time is 0.000567913 s (35.57 Mflops) with 1 threads. -Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 4, 10 leaves, 2.206 bytes/nz, 0.000567913 s/0 threads (speedup 0.038623 x), same?n. +3 iterations (1 th.) took 0.009486s; avg 0.003162s ( +/- 22.33/ 15.18 %); best 0.002456s; worst 0.003642s; std dev. 0.0005099 (taking best). +Reference operation time is 0.00245595 s (8.225 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/0 threads) with: subdivision 4, 10 leaves, 2.206 bytes/nz, 0.00245595 s/0 threads (speedup 0.00893117 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 920.923 Mflops. +Best sparse multiply performance with subdivision multiplier of 0.25: 920.923 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7802,23 +7838,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.059891 s (eq. to 3e+03/ 3e+03 old/new op.times), gained local/global speedup 1 x (2.19345e-05 : 2.19345e-05) / 1 x (2.19345e-05 : 2.19345e-05). This is not amortizable ! -Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.06s, 0.046s for constructor, 0 clones) obtained NO speedup (best stays 920.9 Mflops). -Second run of RSB Autotuner took 0.060035 s and estimated a speedup of 1.000000 x (2.193e-05 s -> 2.193e-05 s per op) in same matrix (1 -> 1 lsubm) +Last tuner inner round (1 of 1) took 0.196907 s (eq. to 9e+03/ 9e+03 old/new op.times), gained local/global speedup 1.04348 x (2.28882e-05 : 2.19345e-05) / 1.04348 x (2.28882e-05 : 2.19345e-05). This is amortizable in 206472 op.times. +In 1 tuning rounds (tot. 0.2s, 0.15s for constructor, 0 clones) obtained a SPEEDUP of 4.3% (1.043x) (from 882.6 to 920.9 Mflops). +Second run of RSB Autotuner took 0.197033 s and estimated a speedup of 1.043478 x (2.289e-05 s -> 2.193e-05 s per op) in new matrix (1 -> 1 lsubm) +RSB Autotuner suggested a new matrix: freeing the old one. #min:1 #max:1 #sum:100 #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001148 0.004281 0.005429 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005429 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001148 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004281 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.003487 0.014968 0.018455 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.018455 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003487 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.014968 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005429 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.018455 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -7833,34 +7869,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.0075779 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.026345 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00114799 0 0.00428104 -# so far, program took 6.317s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.193s/0.000s . +%constructor:lower-100x100-5050nz 0 0.00348711 0 0.0149679 +# so far, program took 6.787s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.577s/0.000s . getrusage() stats: ru_maxrss: 5 (maximum resident set size -- MB) -ru_stime : 0.05219s (system CPU time used) -ru_utime : 6.665s (user CPU time used) +ru_stime : 0.0801s (system CPU time used) +ru_utime : 6.7s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 6.317s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.193s/0.000s . +# so far, program took 6.787s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.577s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 7.245e-03 s (100.00 %) - analyzed arrays in 1.069e-03 s (14.76 %) - cleaned-up arrays in 6.104e-05 s (0.84 %) - deduplicated arrays in 1.597e-05 s (0.22 %) + converted COO to RSB in 2.436e-02 s (100.00 %) + analyzed arrays in 3.914e-03 s (16.07 %) + cleaned-up arrays in 5.889e-05 s (0.24 %) + deduplicated arrays in 1.621e-05 s (0.07 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.926e-03 s (54.19 %) - memory allocations took 1.192e-05 s (0.16 %) - leafs setup took 5.007e-06 s (0.07 %) - halfword conversion took 2.155e-03 s (29.75 %) -Built (100 x 100)[0x1d91b30]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.007s): (100 x 100)[0x1d91b30]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 1.409e-02 s (57.86 %) + memory allocations took 1.192e-05 s (0.05 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 6.256e-03 s (25.68 %) +Built (100 x 100)[0x180a9f0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.024s): (100 x 100)[0x180a9f0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -7911,10 +7947,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002883s; avg 0.0009611s ( +/- 44.85/ 22.80 %); best 0.00053s; worst 0.00118s; std dev. 0.0003048 (taking best). -Reference operation time is 0.000530005 s (152.5 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.00053 Mflops: 152.452) -Merge (3 -> 1 leaves) took w.c.t. of 0.000133s, ~0.0001152s of computing time (of which 5.412e-05s sorting, 5.96e-06s analysis) +3 iterations (1 th.) took 0.007529s; avg 0.00251s ( +/- 21.86/ 32.37 %); best 0.001961s; worst 0.003322s; std dev. 0.0005861 (taking best). +Reference operation time is 0.00196099 s (41.2 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.001961 Mflops: 41.204) +Merge (3 -> 1 leaves) took w.c.t. of 0.0001712s, ~0.000149s of computing time (of which 7.296e-05s sorting, 8.821e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7945,8 +7981,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0002701s; avg 9.004e-05s ( +/- 3.35/ 5.65 %); best 8.702e-05s; worst 9.513e-05s; std dev. 3.618e-06 (taking best). -Reference operation time is 8.70228e-05 s (928.5 Mflops) with 1 threads. +3 iterations (1 th.) took 0.0002801s; avg 9.338e-05s ( +/- 3.49/ 6.21 %); best 9.012e-05s; worst 9.918e-05s; std dev. 4.113e-06 (taking best). +Reference operation time is 9.01222e-05 s (896.6 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7962,16 +7998,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 8.702e-05 s ~Mflops: 928.493 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 6.090x: 0.00053s -> 8.702e-05s, so taking this instance. +After merge step 1: tpop: 9.012e-05 s ~Mflops: 896.560 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 21.759x: 0.001961s -> 9.012e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01526s (of which 0.0001421s partitioning, 0.01185s I/O); computing times: 0.0001152s in par. loops, 5.412e-05s sorting, 5.96e-06s analyzing) -Total merge + benchmarking process took 0.01526s, equivalent to 175.4/28.8 new/old ops (0.005854s for 2 clones -- as 67.3/11.0 ops, or 33.6/5.5 ops per clone), SPEEDUP of 6.090x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 6.090x (0.00053s -> 8.702e-05s), will amortize in 34.5 ops by saving 0.000443s per op. -In 1 tuning rounds (tot. 0.022s, 0.0059s for constructor, 2 clones) obtained a SPEEDUP of 509.0% (6.09x) (from 152.5 to 928.5 Mflops). Employed 0.012s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.04096s (of which 0.0001781s partitioning, 0.03351s I/O); computing times: 0.000149s in par. loops, 7.296e-05s sorting, 8.821e-06s analyzing) +Total merge + benchmarking process took 0.04096s, equivalent to 454.5/20.9 new/old ops (0.01953s for 2 clones -- as 216.7/10.0 ops, or 108.4/5.0 ops per clone), SPEEDUP of 21.759x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 21.759x (0.001961s -> 9.012e-05s), will amortize in 21.9 ops by saving 0.001871s per op. +In 1 tuning rounds (tot. 0.062s, 0.02s for constructor, 2 clones) obtained a SPEEDUP of 2075.9% (21.76x) (from 41.2 to 896.6 Mflops). Employed 0.02s for I/O of matrix plots. #pr: updating sample at index 3 (2^th of 4), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.0340452 s (5.300e-04 s -> 8.702e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.081877 s (1.961e-03 s -> 9.012e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -8037,20 +8073,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0002739s; avg 9.131e-05s ( +/- 6.01/ 9.66 %); best 8.583e-05s; worst 0.0001001s; std dev. 6.299e-06 (taking best). -Reference operation time is 8.58307e-05 s (941.4 Mflops) with 1 threads. +3 iterations (1 th.) took 0.0002799s; avg 9.33e-05s ( +/- 6.98/ 13.71 %); best 8.678e-05s; worst 0.0001061s; std dev. 9.048e-06 (taking best). +Reference operation time is 8.67844e-05 s (931 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.447e-03 s (100.00 %) - analyzed arrays in 1.102e-03 s (31.97 %) - cleaned-up arrays in 5.913e-05 s (1.72 %) - deduplicated arrays in 1.502e-05 s (0.44 %) + converted COO to RSB in 1.254e-02 s (100.00 %) + analyzed arrays in 3.363e-03 s (26.82 %) + cleaned-up arrays in 5.913e-05 s (0.47 %) + deduplicated arrays in 1.502e-05 s (0.12 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.241e-03 s (65.02 %) - memory allocations took 9.775e-06 s (0.28 %) - leafs setup took 4.053e-06 s (0.12 %) - halfword conversion took 1.383e-05 s (0.40 %) -Built (100 x 100)[0x1d80860]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 9.073e-03 s (72.35 %) + memory allocations took 1.001e-05 s (0.08 %) + leafs setup took 5.007e-06 s (0.04 %) + halfword conversion took 1.383e-05 s (0.11 %) +Built (100 x 100)[0x17e77c0]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 4). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -8084,16 +8120,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.699e-03 s (100.00 %) - analyzed arrays in 2.417e-03 s (27.79 %) - cleaned-up arrays in 5.889e-05 s (0.68 %) - deduplicated arrays in 1.502e-05 s (0.17 %) + converted COO to RSB in 3.219e-02 s (100.00 %) + analyzed arrays in 8.822e-03 s (27.41 %) + cleaned-up arrays in 5.913e-05 s (0.18 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.004e-03 s (46.03 %) - memory allocations took 1.287e-05 s (0.15 %) - leafs setup took 4.053e-06 s (0.05 %) - halfword conversion took 2.185e-03 s (25.12 %) -Built (100 x 100)[0x1d73ae0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + shuffled partitions in 1.436e-02 s (44.61 %) + memory allocations took 9.537e-06 s (0.03 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 8.916e-03 s (27.70 %) +Built (100 x 100)[0x17fa120]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8139,9 +8175,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002865s; avg 0.000955s ( +/- 28.58/ 21.15 %); best 0.0006821s; worst 0.001157s; std dev. 0.0002003 (taking best). -Reference operation time is 0.000682116 s (118.5 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000682116 s/0 threads (speedup 0.12583 x), same?n. +3 iterations (1 th.) took 0.01055s; avg 0.003517s ( +/- 30.12/ 50.88 %); best 0.002458s; worst 0.005307s; std dev. 0.001273 (taking best). +Reference operation time is 0.0024581 s (32.87 Mflops) with 1 threads. +Challenging best inner round reference (8.67844e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.0024581 s/0 threads (speedup 0.0353055 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -8175,16 +8211,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.053e-03 s (100.00 %) - analyzed arrays in 2.428e-03 s (26.82 %) - cleaned-up arrays in 5.913e-05 s (0.65 %) - deduplicated arrays in 1.502e-05 s (0.17 %) + converted COO to RSB in 3.077e-02 s (100.00 %) + analyzed arrays in 9.310e-03 s (30.26 %) + cleaned-up arrays in 5.889e-05 s (0.19 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.402e-03 s (48.62 %) - memory allocations took 1.407e-05 s (0.16 %) - leafs setup took 4.053e-06 s (0.04 %) - halfword conversion took 2.130e-03 s (23.53 %) -Built (100 x 100)[0x1d91b30]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.403e-02 s (45.60 %) + memory allocations took 1.526e-05 s (0.05 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 7.329e-03 s (23.82 %) +Built (100 x 100)[0x17c1f50]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8230,9 +8266,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003239s; avg 0.00108s ( +/- 15.24/ 19.29 %); best 0.0009151s; worst 0.001288s; std dev. 0.0001553 (taking best). -Reference operation time is 0.000915051 s (88.3 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000915051 s/0 threads (speedup 0.0937989 x), same?n. +3 iterations (1 th.) took 0.01222s; avg 0.004072s ( +/- 18.40/ 25.56 %); best 0.003323s; worst 0.005113s; std dev. 0.0007594 (taking best). +Reference operation time is 0.00332284 s (24.32 Mflops) with 1 threads. +Challenging best inner round reference (8.67844e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.00332284 s/0 threads (speedup 0.0261175 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -8266,16 +8302,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.102e-03 s (100.00 %) - analyzed arrays in 2.612e-03 s (28.70 %) - cleaned-up arrays in 5.794e-05 s (0.64 %) - deduplicated arrays in 1.502e-05 s (0.17 %) + converted COO to RSB in 2.982e-02 s (100.00 %) + analyzed arrays in 8.142e-03 s (27.30 %) + cleaned-up arrays in 5.913e-05 s (0.20 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.225e-03 s (46.42 %) - memory allocations took 1.216e-05 s (0.13 %) - leafs setup took 4.053e-06 s (0.04 %) - halfword conversion took 2.175e-03 s (23.89 %) -Built (100 x 100)[0x1d91b30]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.629e-02 s (54.61 %) + memory allocations took 1.454e-05 s (0.05 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 5.295e-03 s (17.76 %) +Built (100 x 100)[0x17c1f50]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8321,9 +8357,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003232s; avg 0.001077s ( +/- 24.71/ 18.24 %); best 0.0008111s; worst 0.001274s; std dev. 0.0001952 (taking best). -Reference operation time is 0.0008111 s (99.62 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 1, 10 leaves, 2.206 bytes/nz, 0.0008111 s/0 threads (speedup 0.10582 x), same?n. +3 iterations (1 th.) took 0.01134s; avg 0.003782s ( +/- 31.65/ 48.75 %); best 0.002585s; worst 0.005625s; std dev. 0.001323 (taking best). +Reference operation time is 0.00258493 s (31.26 Mflops) with 1 threads. +Challenging best inner round reference (8.67844e-05 s/1 threads) with: subdivision 1, 10 leaves, 2.206 bytes/nz, 0.00258493 s/0 threads (speedup 0.0335731 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -8357,16 +8393,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.882e-03 s (100.00 %) - analyzed arrays in 2.299e-03 s (25.88 %) - cleaned-up arrays in 5.913e-05 s (0.67 %) - deduplicated arrays in 1.502e-05 s (0.17 %) + converted COO to RSB in 3.393e-02 s (100.00 %) + analyzed arrays in 8.765e-03 s (25.83 %) + cleaned-up arrays in 5.913e-05 s (0.17 %) + deduplicated arrays in 1.502e-05 s (0.04 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.368e-03 s (49.18 %) - memory allocations took 1.574e-05 s (0.18 %) - leafs setup took 5.960e-06 s (0.07 %) - halfword conversion took 2.118e-03 s (23.85 %) -Built (100 x 100)[0x1d91b30]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.670e-02 s (49.20 %) + memory allocations took 1.383e-05 s (0.04 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 8.374e-03 s (24.68 %) +Built (100 x 100)[0x17c1f50]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8412,9 +8448,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003845s; avg 0.001282s ( +/- 3.71/ 3.37 %); best 0.001234s; worst 0.001325s; std dev. 3.721e-05 (taking best). -Reference operation time is 0.00123405 s (65.48 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 2, 10 leaves, 2.206 bytes/nz, 0.00123405 s/0 threads (speedup 0.0695518 x), same?n. +3 iterations (1 th.) took 0.01161s; avg 0.003869s ( +/- 33.13/ 39.25 %); best 0.002587s; worst 0.005387s; std dev. 0.001155 (taking best). +Reference operation time is 0.00258708 s (31.23 Mflops) with 1 threads. +Challenging best inner round reference (8.67844e-05 s/1 threads) with: subdivision 2, 10 leaves, 2.206 bytes/nz, 0.00258708 s/0 threads (speedup 0.0335453 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -8448,16 +8484,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.812e-03 s (100.00 %) - analyzed arrays in 2.570e-03 s (26.19 %) - cleaned-up arrays in 5.794e-05 s (0.59 %) - deduplicated arrays in 1.621e-05 s (0.17 %) - sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 5.043e-03 s (51.40 %) - memory allocations took 1.979e-05 s (0.20 %) - leafs setup took 5.960e-06 s (0.06 %) - halfword conversion took 2.097e-03 s (21.37 %) -Built (100 x 100)[0x1dc8c90]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + converted COO to RSB in 2.986e-02 s (100.00 %) + analyzed arrays in 9.101e-03 s (30.48 %) + cleaned-up arrays in 5.913e-05 s (0.20 %) + deduplicated arrays in 1.407e-05 s (0.05 %) + sorted arrays in 9.537e-07 s (0.00 %) + shuffled partitions in 1.404e-02 s (47.02 %) + memory allocations took 1.812e-05 s (0.06 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 6.620e-03 s (22.17 %) +Built (100 x 100)[0x1837890]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8503,11 +8539,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003049s; avg 0.001016s ( +/- 47.08/ 33.13 %); best 0.0005379s; worst 0.001353s; std dev. 0.0003475 (taking best). -Reference operation time is 0.000537872 s (150.2 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 4, 10 leaves, 2.206 bytes/nz, 0.000537872 s/0 threads (speedup 0.159574 x), same?n. +3 iterations (1 th.) took 0.01308s; avg 0.00436s ( +/- 47.21/ 47.38 %); best 0.002302s; worst 0.006426s; std dev. 0.001684 (taking best). +Reference operation time is 0.00230193 s (35.1 Mflops) with 1 threads. +Challenging best inner round reference (8.67844e-05 s/1 threads) with: subdivision 4, 10 leaves, 2.206 bytes/nz, 0.00230193 s/0 threads (speedup 0.0377007 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 941.388 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 931.043 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8523,23 +8559,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.068193 s (eq. to 8e+02/ 8e+02 old/new op.times), gained local/global speedup 1 x (8.58307e-05 : 8.58307e-05) / 1 x (8.58307e-05 : 8.58307e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.233855 s (eq. to 3e+03/ 3e+03 old/new op.times), gained local/global speedup 1 x (8.67844e-05 : 8.67844e-05) / 1 x (8.67844e-05 : 8.67844e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.068s, 0.051s for constructor, 0 clones) obtained NO speedup (best stays 941.4 Mflops). -Second run of RSB Autotuner took 0.0682669 s and estimated a speedup of 1.000000 x (8.583e-05 s -> 8.583e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.23s, 0.17s for constructor, 0 clones) obtained NO speedup (best stays 931 Mflops). +Second run of RSB Autotuner took 0.233932 s and estimated a speedup of 1.000000 x (8.678e-05 s -> 8.678e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001069 0.003926 0.004995 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004995 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001069 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003926 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.003914 0.014094 0.018008 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.018008 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003914 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.014094 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004995 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.018008 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -8554,34 +8590,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00724506 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.024359 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00106907 0 0.00392604 -# so far, program took 6.437s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.295s/0.000s . +%constructor:lower-100x100-5050nz 0 0.00391388 0 0.0140939 +# so far, program took 7.157s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.892s/0.000s . getrusage() stats: ru_maxrss: 5 (maximum resident set size -- MB) -ru_stime : 0.06431s (system CPU time used) -ru_utime : 6.979s (user CPU time used) +ru_stime : 0.09649s (system CPU time used) +ru_utime : 7.023s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 6.437s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.295s/0.000s . +# so far, program took 7.157s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.892s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.199e-03 s (100.00 %) - analyzed arrays in 1.103e-03 s (13.45 %) - cleaned-up arrays in 6.199e-05 s (0.76 %) - deduplicated arrays in 1.597e-05 s (0.19 %) + converted COO to RSB in 2.522e-02 s (100.00 %) + analyzed arrays in 3.386e-03 s (13.43 %) + cleaned-up arrays in 5.913e-05 s (0.23 %) + deduplicated arrays in 1.502e-05 s (0.06 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.286e-03 s (52.27 %) - memory allocations took 2.193e-05 s (0.27 %) - leafs setup took 4.053e-06 s (0.05 %) - halfword conversion took 2.705e-03 s (32.99 %) -Built (100 x 100)[0x1d6bc70]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.008s): (100 x 100)[0x1d6bc70]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 1.509e-02 s (59.83 %) + memory allocations took 2.289e-05 s (0.09 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 6.640e-03 s (26.33 %) +Built (100 x 100)[0x17c1f50]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.025s): (100 x 100)[0x17c1f50]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -8632,10 +8668,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003299s; avg 0.0011s ( +/- 17.98/ 20.85 %); best 0.0009019s; worst 0.001329s; std dev. 0.0001757 (taking best). -Reference operation time is 0.000901937 s (89.58 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0009019 Mflops: 89.585) -Merge (3 -> 1 leaves) took w.c.t. of 0.0002332s, ~0.0001771s of computing time (of which 8.106e-05s sorting, 7.153e-06s analysis) +3 iterations (1 th.) took 0.01153s; avg 0.003844s ( +/- 40.04/ 30.72 %); best 0.002305s; worst 0.005025s; std dev. 0.001139 (taking best). +Reference operation time is 0.00230503 s (35.05 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.002305 Mflops: 35.054) +Merge (3 -> 1 leaves) took w.c.t. of 0.000138s, ~0.0001221s of computing time (of which 6.199e-05s sorting, 6.199e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8666,8 +8702,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0002739s; avg 9.131e-05s ( +/- 2.61/ 2.87 %); best 8.893e-05s; worst 9.394e-05s; std dev. 2.051e-06 (taking best). -Reference operation time is 8.89301e-05 s (908.6 Mflops) with 1 threads. +3 iterations (1 th.) took 0.0002689s; avg 8.965e-05s ( +/- 2.93/ 4.79 %); best 8.702e-05s; worst 9.394e-05s; std dev. 3.059e-06 (taking best). +Reference operation time is 8.70228e-05 s (928.5 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8683,16 +8719,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 8.893e-05 s ~Mflops: 908.578 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 10.142x: 0.0009019s -> 8.893e-05s, so taking this instance. +After merge step 1: tpop: 8.702e-05 s ~Mflops: 928.493 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 26.488x: 0.002305s -> 8.702e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01565s (of which 0.0002451s partitioning, 0.01245s I/O); computing times: 0.0001771s in par. loops, 8.106e-05s sorting, 7.153e-06s analyzing) -Total merge + benchmarking process took 0.01565s, equivalent to 176.0/17.3 new/old ops (0.005475s for 2 clones -- as 61.6/6.1 ops, or 30.8/3.0 ops per clone), SPEEDUP of 10.142x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 10.142x (0.0009019s -> 8.893e-05s), will amortize in 19.2 ops by saving 0.000813s per op. -In 1 tuning rounds (tot. 0.022s, 0.0055s for constructor, 2 clones) obtained a SPEEDUP of 914.2% (10.14x) (from 89.58 to 908.6 Mflops). Employed 0.013s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.03897s (of which 0.0001471s partitioning, 0.0272s I/O); computing times: 0.0001221s in par. loops, 6.199e-05s sorting, 6.199e-06s analyzing) +Total merge + benchmarking process took 0.03897s, equivalent to 447.8/16.9 new/old ops (0.0224s for 2 clones -- as 257.4/9.7 ops, or 128.7/4.9 ops per clone), SPEEDUP of 26.488x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 26.488x (0.002305s -> 8.702e-05s), will amortize in 17.6 ops by saving 0.002218s per op. +In 1 tuning rounds (tot. 0.065s, 0.022s for constructor, 2 clones) obtained a SPEEDUP of 2548.8% (26.49x) (from 35.05 to 928.5 Mflops). Employed 0.028s for I/O of matrix plots. #pr: updating sample at index 4 (3^th of 4), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.0356231 s (9.019e-04 s -> 8.893e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0924921 s (2.305e-03 s -> 8.702e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -8758,20 +8794,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0002768s; avg 9.227e-05s ( +/- 6.98/ 10.34 %); best 8.583e-05s; worst 0.0001018s; std dev. 6.88e-06 (taking best). -Reference operation time is 8.58307e-05 s (941.4 Mflops) with 1 threads. +3 iterations (1 th.) took 0.0002999s; avg 9.998e-05s ( +/- 12.00/ 23.05 %); best 8.798e-05s; worst 0.000123s; std dev. 1.63e-05 (taking best). +Reference operation time is 8.79765e-05 s (918.4 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.383e-03 s (100.00 %) - analyzed arrays in 1.095e-03 s (32.37 %) - cleaned-up arrays in 5.984e-05 s (1.77 %) - deduplicated arrays in 1.597e-05 s (0.47 %) + converted COO to RSB in 1.028e-02 s (100.00 %) + analyzed arrays in 3.793e-03 s (36.90 %) + cleaned-up arrays in 6.008e-05 s (0.58 %) + deduplicated arrays in 1.478e-05 s (0.14 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.181e-03 s (64.47 %) - memory allocations took 1.121e-05 s (0.33 %) - leafs setup took 5.007e-06 s (0.15 %) - halfword conversion took 1.407e-05 s (0.42 %) -Built (100 x 100)[0x1d72240]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 6.382e-03 s (62.09 %) + memory allocations took 9.060e-06 s (0.09 %) + leafs setup took 4.053e-06 s (0.04 %) + halfword conversion took 1.407e-05 s (0.14 %) +Built (100 x 100)[0x17f9c10]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 4). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -8805,16 +8841,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.276e-03 s (100.00 %) - analyzed arrays in 2.504e-03 s (26.99 %) - cleaned-up arrays in 5.913e-05 s (0.64 %) - deduplicated arrays in 1.502e-05 s (0.16 %) + converted COO to RSB in 3.208e-02 s (100.00 %) + analyzed arrays in 1.137e-02 s (35.46 %) + cleaned-up arrays in 5.889e-05 s (0.18 %) + deduplicated arrays in 1.502e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.484e-03 s (48.34 %) - memory allocations took 1.383e-05 s (0.15 %) - leafs setup took 5.960e-06 s (0.06 %) - halfword conversion took 2.192e-03 s (23.63 %) -Built (100 x 100)[0x1d6ed20]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 5, symflags:'LS' + shuffled partitions in 1.349e-02 s (42.04 %) + memory allocations took 1.597e-05 s (0.05 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 7.121e-03 s (22.20 %) +Built (100 x 100)[0x17c1f50]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8860,10 +8896,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003223s; avg 0.001074s ( +/- 7.21/ 8.46 %); best 0.0009968s; worst 0.001165s; std dev. 6.936e-05 (taking best). -Reference operation time is 0.000996828 s (81.06 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 0.25, 5 leaves, 2.143 bytes/nz, 0.000996828 s/0 threads (speedup 0.0861038 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 7 subms, 5 lsubms, 2.1426 bpnz +3 iterations (1 th.) took 0.01179s; avg 0.003932s ( +/- 27.26/ 27.45 %); best 0.00286s; worst 0.005011s; std dev. 0.0008782 (taking best). +Reference operation time is 0.00285983 s (28.25 Mflops) with 1 threads. +Challenging best inner round reference (8.79765e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 0.00285983 s/0 threads (speedup 0.0307628 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 8 subms, 6 lsubms, 2.1632 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8896,16 +8932,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.846e-03 s (100.00 %) - analyzed arrays in 2.749e-03 s (31.08 %) - cleaned-up arrays in 5.794e-05 s (0.65 %) - deduplicated arrays in 1.478e-05 s (0.17 %) - sorted arrays in 1.192e-06 s (0.01 %) - shuffled partitions in 3.859e-03 s (43.63 %) - memory allocations took 1.574e-05 s (0.18 %) - leafs setup took 5.007e-06 s (0.06 %) - halfword conversion took 2.142e-03 s (24.21 %) -Built (100 x 100)[0x1d6bc70]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + converted COO to RSB in 3.088e-02 s (100.00 %) + analyzed arrays in 7.417e-03 s (24.02 %) + cleaned-up arrays in 5.889e-05 s (0.19 %) + deduplicated arrays in 1.502e-05 s (0.05 %) + sorted arrays in 0.000e+00 s (0.00 %) + shuffled partitions in 1.446e-02 s (46.83 %) + memory allocations took 1.431e-05 s (0.05 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 8.907e-03 s (28.84 %) +Built (100 x 100)[0x17c3020]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8951,9 +8987,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003019s; avg 0.001006s ( +/- 5.39/ 3.94 %); best 0.000952s; worst 0.001046s; std dev. 3.972e-05 (taking best). -Reference operation time is 0.000952005 s (84.87 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000952005 s/0 threads (speedup 0.0901578 x), same?n. +3 iterations (1 th.) took 0.01114s; avg 0.003713s ( +/- 2.59/ 2.20 %); best 0.003617s; worst 0.003795s; std dev. 7.334e-05 (taking best). +Reference operation time is 0.00361705 s (22.34 Mflops) with 1 threads. +Challenging best inner round reference (8.79765e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.00361705 s/0 threads (speedup 0.0243227 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -8987,16 +9023,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.856e-03 s (100.00 %) - analyzed arrays in 2.161e-03 s (24.40 %) - cleaned-up arrays in 5.817e-05 s (0.66 %) - deduplicated arrays in 1.502e-05 s (0.17 %) - sorted arrays in 9.537e-07 s (0.01 %) - shuffled partitions in 4.407e-03 s (49.76 %) - memory allocations took 1.383e-05 s (0.16 %) - leafs setup took 5.007e-06 s (0.06 %) - halfword conversion took 2.194e-03 s (24.78 %) -Built (100 x 100)[0x1d82e40]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + converted COO to RSB in 2.877e-02 s (100.00 %) + analyzed arrays in 7.243e-03 s (25.18 %) + cleaned-up arrays in 6.008e-05 s (0.21 %) + deduplicated arrays in 1.478e-05 s (0.05 %) + sorted arrays in 0.000e+00 s (0.00 %) + shuffled partitions in 1.458e-02 s (50.69 %) + memory allocations took 3.600e-05 s (0.13 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 6.825e-03 s (23.72 %) +Built (100 x 100)[0x17c3020]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -9042,9 +9078,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003162s; avg 0.001054s ( +/- 5.02/ 7.60 %); best 0.001001s; worst 0.001134s; std dev. 5.761e-05 (taking best). -Reference operation time is 0.00100112 s (80.71 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 1, 10 leaves, 2.206 bytes/nz, 0.00100112 s/0 threads (speedup 0.0857347 x), same?n. +3 iterations (1 th.) took 0.01219s; avg 0.004065s ( +/- 20.09/ 39.91 %); best 0.003248s; worst 0.005687s; std dev. 0.001147 (taking best). +Reference operation time is 0.00324798 s (24.88 Mflops) with 1 threads. +Challenging best inner round reference (8.79765e-05 s/1 threads) with: subdivision 1, 10 leaves, 2.206 bytes/nz, 0.00324798 s/0 threads (speedup 0.0270865 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -9078,16 +9114,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.951e-03 s (100.00 %) - analyzed arrays in 2.216e-03 s (24.76 %) - cleaned-up arrays in 5.817e-05 s (0.65 %) - deduplicated arrays in 1.502e-05 s (0.17 %) - sorted arrays in 9.537e-07 s (0.01 %) - shuffled partitions in 4.530e-03 s (50.61 %) - memory allocations took 1.383e-05 s (0.15 %) - leafs setup took 5.960e-06 s (0.07 %) - halfword conversion took 2.108e-03 s (23.55 %) -Built (100 x 100)[0x1dfa1e0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + converted COO to RSB in 2.978e-02 s (100.00 %) + analyzed arrays in 8.693e-03 s (29.19 %) + cleaned-up arrays in 5.984e-05 s (0.20 %) + deduplicated arrays in 1.502e-05 s (0.05 %) + sorted arrays in 0.000e+00 s (0.00 %) + shuffled partitions in 1.414e-02 s (47.49 %) + memory allocations took 1.621e-05 s (0.05 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 6.845e-03 s (22.99 %) +Built (100 x 100)[0x1863f00]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -9133,9 +9169,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003094s; avg 0.001031s ( +/- 5.08/ 4.72 %); best 0.0009789s; worst 0.00108s; std dev. 4.135e-05 (taking best). -Reference operation time is 0.000978947 s (82.54 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 2, 10 leaves, 2.206 bytes/nz, 0.000978947 s/0 threads (speedup 0.0876766 x), same?n. +3 iterations (1 th.) took 0.01136s; avg 0.003786s ( +/- 30.48/ 30.66 %); best 0.002632s; worst 0.004947s; std dev. 0.0009451 (taking best). +Reference operation time is 0.0026319 s (30.7 Mflops) with 1 threads. +Challenging best inner round reference (8.79765e-05 s/1 threads) with: subdivision 2, 10 leaves, 2.206 bytes/nz, 0.0026319 s/0 threads (speedup 0.0334269 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -9169,16 +9205,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.795e-03 s (100.00 %) - analyzed arrays in 2.178e-03 s (24.76 %) - cleaned-up arrays in 5.889e-05 s (0.67 %) - deduplicated arrays in 1.597e-05 s (0.18 %) + converted COO to RSB in 3.266e-02 s (100.00 %) + analyzed arrays in 7.378e-03 s (22.59 %) + cleaned-up arrays in 5.889e-05 s (0.18 %) + deduplicated arrays in 1.597e-05 s (0.05 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.150e-03 s (47.19 %) - memory allocations took 3.219e-05 s (0.37 %) - leafs setup took 4.053e-06 s (0.05 %) - halfword conversion took 2.354e-03 s (26.76 %) -Built (100 x 100)[0x1dfa1e0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.588e-02 s (48.63 %) + memory allocations took 6.390e-05 s (0.20 %) + leafs setup took 5.960e-06 s (0.02 %) + halfword conversion took 9.253e-03 s (28.33 %) +Built (100 x 100)[0x1863f00]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -9224,11 +9260,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002929s; avg 0.0009763s ( +/- 15.90/ 13.77 %); best 0.0008211s; worst 0.001111s; std dev. 0.0001192 (taking best). -Reference operation time is 0.000821114 s (98.4 Mflops) with 1 threads. -Challenging best inner round reference (8.58307e-05 s/1 threads) with: subdivision 4, 10 leaves, 2.206 bytes/nz, 0.000821114 s/0 threads (speedup 0.10453 x), same?n. +3 iterations (1 th.) took 0.01002s; avg 0.00334s ( +/- 27.73/ 14.39 %); best 0.002414s; worst 0.003821s; std dev. 0.0006552 (taking best). +Reference operation time is 0.00241399 s (33.47 Mflops) with 1 threads. +Challenging best inner round reference (8.79765e-05 s/1 threads) with: subdivision 4, 10 leaves, 2.206 bytes/nz, 0.00241399 s/0 threads (speedup 0.0364444 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 941.388 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 918.428 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -9244,23 +9280,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0673909 s (eq. to 8e+02/ 8e+02 old/new op.times), gained local/global speedup 1 x (8.58307e-05 : 8.58307e-05) / 1 x (8.58307e-05 : 8.58307e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.228871 s (eq. to 3e+03/ 3e+03 old/new op.times), gained local/global speedup 1 x (8.79765e-05 : 8.79765e-05) / 1 x (8.79765e-05 : 8.79765e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.067s, 0.05s for constructor, 0 clones) obtained NO speedup (best stays 941.4 Mflops). -Second run of RSB Autotuner took 0.0675061 s and estimated a speedup of 1.000000 x (8.583e-05 s -> 8.583e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.23s, 0.17s for constructor, 0 clones) obtained NO speedup (best stays 918.4 Mflops). +Second run of RSB Autotuner took 0.228946 s and estimated a speedup of 1.000000 x (8.798e-05 s -> 8.798e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001103 0.004286 0.005389 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005389 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001103 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004286 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.003386 0.015086 0.018472 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.018472 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003386 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.015086 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005389 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.018472 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -9275,68 +9311,68 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00819898 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.0252161 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00110316 0 0.00428581 -# so far, program took 6.557s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.398s/0.000s . +%constructor:lower-100x100-5050nz 0 0.00338602 0 0.0150859 +# so far, program took 7.534s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.214s/0.000s . getrusage() stats: ru_maxrss: 5 (maximum resident set size -- MB) -ru_stime : 0.07639s (system CPU time used) -ru_utime : 7.29s (user CPU time used) +ru_stime : 0.1166s (system CPU time used) +ru_utime : 7.34s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 4) ordered by (1,1,1,1,1,4,1) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 920.92 9.611e-04 0.000e+00 2.193e-05 0.000e+00 3.399e-02 2.43e+00 2.60e+00 1 2.02e-02 -pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 920.92 9.730e-04 0.000e+00 2.193e-05 0.000e+00 3.317e-02 1.45e+00 1.56e+00 1 2.02e-02 -pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 928.49 5.300e-04 0.000e+00 8.702e-05 0.000e+00 3.405e-02 6.13e-01 6.50e-01 1 8.08e-02 -pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 908.58 9.019e-04 0.000e+00 8.893e-05 0.000e+00 3.562e-02 1.08e+00 1.17e+00 1 8.08e-02 +pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 882.55 2.400e-03 0.000e+00 2.289e-05 0.000e+00 8.450e-02 2.33e+00 2.60e+00 1 2.02e-02 +pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 920.92 2.348e-03 0.000e+00 2.193e-05 0.000e+00 8.306e-02 1.45e+00 1.56e+00 1 2.02e-02 +pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 896.56 1.961e-03 0.000e+00 9.012e-05 0.000e+00 8.188e-02 5.91e-01 6.50e-01 1 8.08e-02 +pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 928.49 2.305e-03 0.000e+00 8.702e-05 0.000e+00 9.249e-02 1.10e+00 1.17e+00 1 8.08e-02 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 2510.2 % faster, avg. sp. ratio 26.102x, max sp. ratio 44.359x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 963.3/391.2/1549.4/3853.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 43.3/ 34.1/ 64.2/173.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 47.9, min. 34.9, max. 76.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 6403.9 % faster, avg. sp. ratio 65.039x, max sp. ratio 107.054x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2362.5/908.5/3786.8/9450.0 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 38.1/ 35.2/ 41.8/152.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 39.2, min. 35.5, max. 43.8 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 1683/ 1683/ 1683) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 5050/ 5050/ 5050) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 15150/ 6733/ 26933) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 45450/ 20200/ 80800) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 2.121/ 2.121/ 2.121) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.374/ 0.603/ 2.394,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 5.578/ 0.613/ 2.430,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.350/ 0.583/ 2.294,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 5.479/ 0.591/ 2.329,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.495/ 0.650/ 2.599) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 2.080/ 2.080/ 2.080) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.14 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.03 s, max 0.04 s, tot 0.14 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 9.197e+02, min 9.086e+02, max 9.285e+02 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.095e+01, min 2.076e+01, max 1.525e+02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 5.496e-05s, min 2.193e-05s, max 8.893e-05s, tot 2.198e-04s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.415e-04s, min 5.300e-04s, max 9.730e-04s, tot 3.366e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.445e+00 9.699e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.993e-01 -#pr: Record collection took 0.39 s. +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.09 s, min 0.08 s, max 0.09 s, tot 0.34 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.09 s, min 0.08 s, max 0.09 s, tot 0.34 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 9.071e+02, min 8.826e+02, max 9.285e+02 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.332e+01, min 8.417e+00, max 4.120e+01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.549e-05s, min 2.193e-05s, max 9.012e-05s, tot 2.220e-04s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.254e-03s, min 1.961e-03s, max 2.400e-03s, tot 9.014e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.562e+00 1.009e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.978e-01 +#pr: Record collection took 1.18 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 89 environment variables in 3855 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 89 environment variables in 3909 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. #pr: ======== Saved a performance record of 4 samples to test.rpr # Removing the temporary record file test.rpr.tmp. -# terminating run at 1710619234 (after 6.6s of w.c.t.) +# terminating run at 1710622491 (after 7.5s of w.c.t.) + ls -ltr test-tuning-lower-100x100-5050nz--C-N-1--base.eps test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--D-N-1--base.eps test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--S-N-1--base.eps test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--Z-N-1--base.eps test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85623 Mar 16 08:00 test-tuning-lower-100x100-5050nz--D-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84545 Mar 16 08:00 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85622 Mar 16 08:00 test-tuning-lower-100x100-5050nz--S-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84545 Mar 16 08:00 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85623 Mar 16 08:00 test-tuning-lower-100x100-5050nz--C-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84545 Mar 16 08:00 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85622 Mar 16 08:00 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84544 Mar 16 08:00 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85637 Mar 17 10:54 test-tuning-lower-100x100-5050nz--D-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84559 Mar 17 10:54 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85638 Mar 17 10:54 test-tuning-lower-100x100-5050nz--S-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84560 Mar 17 10:54 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85638 Mar 17 10:54 test-tuning-lower-100x100-5050nz--C-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84560 Mar 17 10:54 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85638 Mar 17 10:54 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84560 Mar 17 10:54 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps + rsbench --read-performance-record test.rpr + ls -ltr test.txt --rw-r--r-- 1 pbuilder1 pbuilder1 4082 Mar 16 08:00 test.txt +-rw-r--r-- 1 pbuilder2 pbuilder2 4084 Mar 17 10:54 test.txt + RSB_PR_WLTC=2 + RSB_PR_SR=0 + rsbench --read-performance-record test.rpr @@ -9344,31 +9380,31 @@ /usr/bin/latex + which kpsepath /usr/bin/kpsepath -++ kpsepath tex ++ sed 's/!!//g;s/:/\n/g;' -+ find . /nonexistent/first-build/.texlive2022/texmf-config/tex/kpsewhich// /nonexistent/first-build/.texlive2022/texmf-var/tex/kpsewhich// /nonexistent/first-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/first-build/.texlive2022/texmf-config/tex/generic// /nonexistent/first-build/.texlive2022/texmf-var/tex/generic// /nonexistent/first-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/first-build/.texlive2022/texmf-config/tex/latex// /nonexistent/first-build/.texlive2022/texmf-var/tex/latex// /nonexistent/first-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/first-build/.texlive2022/texmf-config/tex/// /nonexistent/first-build/.texlive2022/texmf-var/tex/// /nonexistent/first-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls -find: '/nonexistent/first-build/.texlive2022/texmf-config/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2022/texmf-var/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/kpsewhich//': No such file or directory +++ kpsepath tex ++ find . /nonexistent/second-build/.texlive2022/texmf-config/tex/kpsewhich// /nonexistent/second-build/.texlive2022/texmf-var/tex/kpsewhich// /nonexistent/second-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/second-build/.texlive2022/texmf-config/tex/generic// /nonexistent/second-build/.texlive2022/texmf-var/tex/generic// /nonexistent/second-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/second-build/.texlive2022/texmf-config/tex/latex// /nonexistent/second-build/.texlive2022/texmf-var/tex/latex// /nonexistent/second-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/second-build/.texlive2022/texmf-config/tex/// /nonexistent/second-build/.texlive2022/texmf-var/tex/// /nonexistent/second-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls +find: '/nonexistent/second-build/.texlive2022/texmf-config/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/.texlive2022/texmf-var/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/kpsewhich//': No such file or directory find: '/usr/local/share/texmf/tex/kpsewhich//': No such file or directory find: '/etc/texmf/tex/kpsewhich//': No such file or directory find: '/var/lib/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texlive/texmf-dist/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2022/texmf-config/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2022/texmf-var/tex/generic//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2022/texmf-config/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2022/texmf-var/tex/generic//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/generic//': No such file or directory find: '/usr/local/share/texmf/tex/generic//': No such file or directory find: '/usr/share/texmf/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2022/texmf-config/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2022/texmf-var/tex/latex//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2022/texmf-config/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2022/texmf-var/tex/latex//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/latex//': No such file or directory find: '/usr/local/share/texmf/tex/latex//': No such file or directory find: '/etc/texmf/tex/latex//': No such file or directory find: '/var/lib/texmf/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2022/texmf-config/tex///': No such file or directory -find: '/nonexistent/first-build/.texlive2022/texmf-var/tex///': No such file or directory -find: '/nonexistent/first-build/texmf/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2022/texmf-config/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2022/texmf-var/tex///': No such file or directory +find: '/nonexistent/second-build/texmf/tex///': No such file or directory find: '/usr/local/share/texmf/tex///': No such file or directory + exit 0 for mf in pd.mtx vf.mtx ; do if test -f /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; then true; else cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/$mf /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; fi; done @@ -9383,7 +9419,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0xc47210]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0x1f9f210]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -9398,7 +9434,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0x2518210]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0xf16210]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -9462,51 +9498,51 @@ Done. Building a matrix with 5 nnz, 5 x 5 Duplicates check: 5 - 0 = 5 - converted COO to RSB in 7.753e-03 s (100.00 %) - analyzed arrays in 2.188e-03 s (28.22 %) - cleaned-up arrays in 1.907e-06 s (0.02 %) - deduplicated arrays in 9.537e-07 s (0.01 %) - sorted arrays in 1.210e-03 s (15.61 %) - shuffled partitions in 2.241e-03 s (28.90 %) - memory allocations took 1.597e-05 s (0.21 %) - leafs setup took 5.007e-06 s (0.06 %) - halfword conversion took 2.088e-03 s (26.93 %) -Built (5 x 5)[0x25195d0]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' + converted COO to RSB in 3.120e-02 s (100.00 %) + analyzed arrays in 7.328e-03 s (23.48 %) + cleaned-up arrays in 9.537e-07 s (0.00 %) + deduplicated arrays in 1.192e-06 s (0.00 %) + sorted arrays in 7.279e-03 s (23.33 %) + shuffled partitions in 9.544e-03 s (30.58 %) + memory allocations took 1.597e-05 s (0.05 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 7.028e-03 s (22.52 %) +Built (5 x 5)[0xf175d0]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' Allocated matrix of 5 nonzeroes: -(5 x 5)[0x25195d0]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(5 x 5)[0xf175d0]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -Before auto-tuning, 100 multiplications took 0.124807s. +Before auto-tuning, 100 multiplications took 0.548597s. Threads autotuning (may take more than 1.500000s)... Will use autotuning routine to sample matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=9.80496e-08), 4 suggested as starting thread count(default). -3 iterations (4 th.) took 0.002757s; avg 0.000919s ( +/- 39.16/ 21.64 %); best 0.0005591s; worst 0.001118s; std dev. 0.000255 (taking best). -Reference operation time is 0.000559092 s (0.03577 Mflops) with 4 threads. -3 iterations (4 th.) took 0.003228s; avg 0.001076s ( +/- 45.63/ 48.78 %); best 0.0005851s; worst 0.001601s; std dev. 0.0004154 (taking best). -Reference operation time is 0.000585079 s (0.03418 Mflops) with 4 threads. -After 0.006153s, autotuning routine did not find a better threads count configuration. -(5 x 5)[0x25195d0]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -After threads auto-tuning, 100 multiplications took 0.138603s -- effective speedup of 0.900465 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=8.9705e-08), 4 suggested as starting thread count(default). +3 iterations (4 th.) took 0.01423s; avg 0.004744s ( +/- 19.10/ 19.88 %); best 0.003838s; worst 0.005687s; std dev. 0.0007553 (taking best). +Reference operation time is 0.00383806 s (0.005211 Mflops) with 4 threads. +3 iterations (4 th.) took 0.01156s; avg 0.003852s ( +/- 13.47/ 15.95 %); best 0.003333s; worst 0.004466s; std dev. 0.0004675 (taking best). +Reference operation time is 0.00333309 s (0.006 Mflops) with 4 threads. +After 0.025925s, autotuning routine did not find a better threads count configuration. +(5 x 5)[0xf175d0]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +After threads auto-tuning, 100 multiplications took 0.412838s -- effective speedup of 1.32884 x Matrix autotuning (may take more than 1.500000s; using 4 threads )... Will autotune matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=9.80496e-08), 4 suggested as starting thread count. -3 iterations (4 th.) took 0.007702s; avg 0.002567s ( +/- 79.24/117.86 %); best 0.0005329s; worst 0.005593s; std dev. 0.002182 (taking best). -Reference operation time is 0.000532866 s (0.03753 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.0005329 Mflops: 0.038) -Merge (2 -> 1 leaves) took w.c.t. of 4.292e-05s, ~7.868e-06s of computing time (of which 9.537e-07s sorting, 9.06e-06s analysis) -3 iterations (4 th.) took 7.868e-06s; avg 2.623e-06s ( +/- 63.64/127.27 %); best 9.537e-07s; worst 5.96e-06s; std dev. 2.36e-06 (taking best). +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=8.9705e-08), 4 suggested as starting thread count. +3 iterations (4 th.) took 0.01047s; avg 0.003491s ( +/- 19.26/ 34.56 %); best 0.002819s; worst 0.004698s; std dev. 0.0008551 (taking best). +Reference operation time is 0.00281906 s (0.007095 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.002819 Mflops: 0.007) +Merge (2 -> 1 leaves) took w.c.t. of 3.29e-05s, ~6.914e-06s of computing time (of which 0s sorting, 6.914e-06s analysis) +3 iterations (4 th.) took 7.153e-06s; avg 2.384e-06s ( +/- 60.00/110.00 %); best 9.537e-07s; worst 5.007e-06s; std dev. 1.857e-06 (taking best). Reference operation time is 9.53674e-07 s (20.97 Mflops) with 4 threads. After merge step 1: tpop: 9.537e-07 s ~Mflops: 20.972 nsubm:1 otn:4 -Applying merge (2 -> 1 leaves, 4 th.) yielded SPEEDUP of 558.750x: 0.0005329s -> 9.537e-07s, so taking this instance. +Applying merge (2 -> 1 leaves, 4 th.) yielded SPEEDUP of 2956.000x: 0.002819s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.003333s (of which 0.000648s partitioning, 0s I/O); computing times: 7.868e-06s in par. loops, 9.537e-07s sorting, 9.06e-06s analyzing) -Total merge + benchmarking process took 0.003333s, equivalent to 3495.0/6.3 new/old ops (0.005845s for 2 clones -- as 6129.0/11.0 ops, or 3064.5/5.5 ops per clone), SPEEDUP of 558.750x -Applying multi-merge (2 -> 1 leaves, 1 steps, 4 -> 4 th.sp.) yielded SPEEDUP of 558.750x (0.0005329s -> 9.537e-07s), will amortize in 6.3 ops by saving 0.0005319s per op. -In 1 tuning rounds (tot. 0.014s, 0.0058s for constructor, 2 clones) obtained a SPEEDUP of 55775.0% (558.8x) (from 0.03753 to 20.97 Mflops). -After 0.014347s, autotuning routine declared speedup of 558.75 x, when using threads count of 4. -(5 x 5)[0x251ba80]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' -After threads auto-tuning, 100 multiplications took 0.000035s -- further speedup of 3954.71 x +A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.01226s (of which 0.001069s partitioning, 0s I/O); computing times: 6.914e-06s in par. loops, 0s sorting, 6.914e-06s analyzing) +Total merge + benchmarking process took 0.01226s, equivalent to 12860.8/4.4 new/old ops (0.02207s for 2 clones -- as 23138.0/7.8 ops, or 11569.0/3.9 ops per clone), SPEEDUP of 2956.000x +Applying multi-merge (2 -> 1 leaves, 1 steps, 4 -> 4 th.sp.) yielded SPEEDUP of 2956.000x (0.002819s -> 9.537e-07s), will amortize in 4.4 ops by saving 0.002818s per op. +In 1 tuning rounds (tot. 0.034s, 0.022s for constructor, 2 clones) obtained a SPEEDUP of 295500.0% (2956x) (from 0.007095 to 20.97 Mflops). +After 0.033752s, autotuning routine declared speedup of 2956 x, when using threads count of 4. +(5 x 5)[0xf19a80]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +After threads auto-tuning, 100 multiplications took 0.000037s -- further speedup of 11171.4 x 0/2 0 0 -> 0 1/2 1 0 -> 5 0/2 0 3 -> 0 @@ -9517,7 +9553,7 @@ Correctly initialized the library. Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0x25195d0]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0xf175d0]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -9668,83 +9704,71 @@ Creating 500 x 500 matrix with 62500 nonzeroes. Building a matrix with 62500 nnz, 500 x 500 Duplicates check: 62500 - 0 = 62500 - converted COO to RSB in 1.926e-02 s (100.00 %) - analyzed arrays in 2.848e-03 s (14.79 %) - cleaned-up arrays in 8.140e-04 s (4.23 %) - deduplicated arrays in 2.270e-04 s (1.18 %) - sorted arrays in 7.944e-03 s (41.24 %) - shuffled partitions in 5.019e-03 s (26.06 %) - memory allocations took 1.109e-04 s (0.58 %) - leafs setup took 1.287e-05 s (0.07 %) - halfword conversion took 2.262e-03 s (11.74 %) -Built (500 x 500)[0x1897fd0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + converted COO to RSB in 5.423e-02 s (100.00 %) + analyzed arrays in 7.215e-03 s (13.31 %) + cleaned-up arrays in 7.441e-04 s (1.37 %) + deduplicated arrays in 2.060e-04 s (0.38 %) + sorted arrays in 2.260e-02 s (41.68 %) + shuffled partitions in 1.533e-02 s (28.28 %) + memory allocations took 9.012e-05 s (0.17 %) + leafs setup took 1.001e-05 s (0.02 %) + halfword conversion took 8.002e-03 s (14.76 %) +Built (500 x 500)[0x128afd0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Allocated matrix of 62500 nonzeroes: -(500 x 500)[0x1897fd0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(500 x 500)[0x128afd0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' -Before auto-tuning, 100 multiplications took 0.579113s. +Before auto-tuning, 100 multiplications took 0.476682s. Threads autotuning (may take more than 1.500000s)... Will use autotuning routine to sample matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 23 subms, 16 lsubms, 2.0650 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=9.75013e-08), 4 suggested as starting thread count(default). -3 iterations (4 th.) took 0.01038s; avg 0.003458s ( +/- 30.52/ 17.32 %); best 0.002403s; worst 0.004057s; std dev. 0.0007485 (taking best). -Reference operation time is 0.00240302 s (104 Mflops) with 4 threads. -3 iterations (4 th.) took 0.004841s; avg 0.001614s ( +/- 14.68/ 25.56 %); best 0.001377s; worst 0.002026s; std dev. 0.0002927 (taking best). -Reference operation time is 0.00137687 s (181.6 Mflops) with 4 threads. -After 0.015368s, autotuning routine did not find a better threads count configuration. -(500 x 500)[0x1897fd0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' -After threads auto-tuning, 100 multiplications took 0.515204s -- effective speedup of 1.12405 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=8.86559e-08), 4 suggested as starting thread count(default). +3 iterations (4 th.) took 0.01934s; avg 0.006446s ( +/- 49.94/ 27.20 %); best 0.003227s; worst 0.008199s; std dev. 0.002279 (taking best). +Reference operation time is 0.003227 s (77.47 Mflops) with 4 threads. +3 iterations (4 th.) took 0.0177s; avg 0.005901s ( +/- 59.67/ 44.83 %); best 0.00238s; worst 0.008547s; std dev. 0.002593 (taking best). +Reference operation time is 0.00237989 s (105 Mflops) with 4 threads. +After 0.037181s, autotuning routine did not find a better threads count configuration. +(500 x 500)[0x128afd0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +After threads auto-tuning, 100 multiplications took 0.213458s -- effective speedup of 2.23314 x Matrix autotuning (may take more than 1.500000s; using 4 threads )... Will autotune matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 23 subms, 16 lsubms, 2.0650 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=9.75013e-08), 4 suggested as starting thread count. -3 iterations (4 th.) took 0.004379s; avg 0.00146s ( +/- 41.77/ 47.57 %); best 0.00085s; worst 0.002154s; std dev. 0.0005358 (taking best). -Reference operation time is 0.000849962 s (294.1 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 23 subms, 16 lsubms, 2.0650 bpnz (tpop: 0.00085 Mflops: 294.131) -Merge (16 -> 10 leaves) took w.c.t. of 0.001429s, ~0.001681s of computing time (of which 0.000845s sorting, 1.192e-05s analysis) -3 iterations (4 th.) took 0.04785s; avg 0.01595s ( +/- 91.34/ 87.16 %); best 0.001382s; worst 0.02985s; std dev. 0.01163 (taking best). -Reference operation time is 0.00138187 s (180.9 Mflops) with 4 threads. -After merge step 1: tpop: 0.001382 s ~Mflops: 180.914 nsubm:10 otn:4 -Applying merge (16 -> 10 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.626x: 0.00085s -> 0.001382s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (16 -> 10 subms) took 0.04934s (of which 0.001445s partitioning, 0s I/O); computing times: 0.001681s in par. loops, 0.000845s sorting, 1.192e-05s analyzing) -Total merge + benchmarking process took 0.04934s, equivalent to 58.0/58.0 new/old ops (0.003808s for 1 clones -- as 4.5/4.5 ops, or 4.5/4.5 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (4 th.) took 0.005307s; avg 0.001769s ( +/- 22.05/ 36.47 %); best 0.001379s; worst 0.002414s; std dev. 0.0004595 (taking best). -Reference operation time is 0.00137901 s (181.3 Mflops) with 4 threads. -Starting split (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 23 subms, 16 lsubms, 2.0650 bpnz (tpop: 0.001379 Mflops: 181.289) -Split (16 -> 40 leaves, 23 -> 55 subms) took 0.001624s (of which: 1.121e-05s analysis, -1.368e+10s mem.mgmt); compute time: 0.001255s overall, 0.0004225s searches, 0.0008326s shuffle, 0.0003779s switch, 9.06e-06s quadrants. -3 iterations (4 th.) took 0.004559s; avg 0.00152s ( +/- 19.60/ 20.03 %); best 0.001222s; worst 0.001824s; std dev. 0.0002459 (taking best). -Reference operation time is 0.0012219 s (204.6 Mflops) with 4 threads. -After split step 1: tpop: 0.001222 s ~Mflops: 204.600 nsubm:40 otn:4 -Applying split (16 -> 40 leaves, 4 th.) yielded SPEEDUP of 1.129x: 0.001379s -> 0.001222s, so taking this instance. -Split (40 -> 100 leaves, 55 -> 135 subms) took 0.001981s (of which: 1.407e-05s analysis, -3.421e+10s mem.mgmt); compute time: 0.002722s overall, 0.001644s searches, 0.001078s shuffle, 0.0003016s switch, 2.551e-05s quadrants. -3 iterations (4 th.) took 0.004418s; avg 0.001473s ( +/- 6.57/ 11.44 %); best 0.001376s; worst 0.001641s; std dev. 0.0001195 (taking best). -Reference operation time is 0.00137591 s (181.7 Mflops) with 4 threads. -After split step 2: tpop: 0.001376 s ~Mflops: 181.697 nsubm:100 otn:4 -Applying split (40 -> 100 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.126x: 0.001222s -> 0.001376s. -Split (100 -> 250 leaves, 135 -> 335 subms) took 0.002212s (of which: 2.503e-05s analysis, -8.553e+10s mem.mgmt); compute time: 0.001737s overall, 0.0006216s searches, 0.001115s shuffle, 0.0002265s switch, 8.75e-05s quadrants. -3 iterations (4 th.) took 0.004207s; avg 0.001402s ( +/- 13.57/ 10.61 %); best 0.001212s; worst 0.001551s; std dev. 0.0001415 (taking best). -Reference operation time is 0.00121212 s (206.3 Mflops) with 4 threads. -After split step 3: tpop: 0.001212 s ~Mflops: 206.250 nsubm:250 otn:4 -Applying split (100 -> 250 leaves, 4 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00806x): 0.001222s -> 0.001212s, so IGNORING this instance. -Split (250 -> 625 leaves, 335 -> 835 subms) took 0.002453s (of which: 5.817e-05s analysis, -2.138e+11s mem.mgmt); compute time: 0.002525s overall, 0.0004499s searches, 0.002075s shuffle, 0.0003541s switch, 0.000464s quadrants. -3 iterations (4 th.) took 0.005185s; avg 0.001728s ( +/- 28.89/ 19.71 %); best 0.001229s; worst 0.002069s; std dev. 0.0003608 (taking best). -Reference operation time is 0.00122905 s (203.4 Mflops) with 4 threads. -After split step 4: tpop: 0.001229 s ~Mflops: 203.410 nsubm:625 otn:4 -Applying split (250 -> 625 leaves, 4 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=0.99418x): 0.001222s -> 0.001229s, so IGNORING this instance. -Split (625 -> 1561 leaves, 835 -> 2083 subms) took 0.00673s (of which: 0.0001709s analysis, -5.337e+11s mem.mgmt); compute time: 0.01038s overall, 0.0007253s searches, 0.009659s shuffle, 0.001267s switch, 0.003433s quadrants. -3 iterations (4 th.) took 0.007295s; avg 0.002432s ( +/- 15.62/ 9.60 %); best 0.002052s; worst 0.002665s; std dev. 0.0002709 (taking best). -Reference operation time is 0.00205183 s (121.8 Mflops) with 4 threads. -After split step 5: tpop: 0.002052 s ~Mflops: 121.842 nsubm:1561 otn:4 -Applying split (625 -> 1561 leaves, 4 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.679x: 0.001222s -> 0.002052s. -Skipping further split based tests after 2 definite performance degradations in a row (and last exceeding limit). -A total of 5 split steps (of max 6) (16 -> 1561 subms) took 0.04772s (of which 0.01789s partitioning, 0s I/O); computing times: 0.01862s in par. loops, 0.003863s sorting, 0.0002794s analyzing) -Total split + benchmarking process took 0.04772s, equivalent to 39.1/34.6 new/old ops (0.008261s for 2 clones -- as 6.8/6.0 ops, or 3.4/3.0 ops per clone), SPEEDUP of 1.129x -Applying multi-split (16 -> 40 leaves, 1 steps, 4 -> 4 th.sp.) yielded SPEEDUP of 1.129x (0.001379s -> 0.001222s), will amortize in 303.7 ops by saving 0.0001571s per op. -In 1 tuning rounds (tot. 0.12s, 0.012s for constructor, 3 clones) obtained a SPEEDUP of 12.9% (1.129x) (from 181.3 to 204.6 Mflops). -After 0.116401s, autotuning routine declared speedup of 1.12859 x, when using threads count of 4. -(500 x 500)[0x189eef0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 40, symflags:'' -After threads auto-tuning, 100 multiplications took 0.283652s -- further speedup of 1.81633 x +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=8.86559e-08), 4 suggested as starting thread count. +3 iterations (4 th.) took 0.004826s; avg 0.001609s ( +/- 1.53/ 2.32 %); best 0.001584s; worst 0.001646s; std dev. 2.686e-05 (taking best). +Reference operation time is 0.00158405 s (157.8 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 23 subms, 16 lsubms, 2.0650 bpnz (tpop: 0.001584 Mflops: 157.823) +Merge (16 -> 10 leaves) took w.c.t. of 0.002752s, ~0.003242s of computing time (of which 0.0006332s sorting, 9.775e-06s analysis) +3 iterations (4 th.) took 0.004752s; avg 0.001584s ( +/- 5.17/ 4.54 %); best 0.001502s; worst 0.001656s; std dev. 6.318e-05 (taking best). +Reference operation time is 0.00150204 s (166.4 Mflops) with 4 threads. +After merge step 1: tpop: 0.001502 s ~Mflops: 166.441 nsubm:10 otn:4 +Applying merge (16 -> 10 leaves, 4 th.) yielded SPEEDUP of 1.055x: 0.001584s -> 0.001502s, so taking this instance. +Merge (10 -> 7 leaves) took w.c.t. of 0.0005291s, ~0.0005062s of computing time (of which 0.0003359s sorting, 8.106e-06s analysis) +3 iterations (4 th.) took 0.00461s; avg 0.001537s ( +/- 3.36/ 5.55 %); best 0.001485s; worst 0.001622s; std dev. 6.074e-05 (taking best). +Reference operation time is 0.00148511 s (168.3 Mflops) with 4 threads. +After merge step 2: tpop: 0.001485 s ~Mflops: 168.338 nsubm:7 otn:4 +Applying merge (10 -> 7 leaves, 4 th.) yielded SPEEDUP of 1.011x: 0.001502s -> 0.001485s, so taking this instance. +Merge (7 -> 4 leaves) took w.c.t. of 0.0003488s, ~0.0003309s of computing time (of which 0.000181s sorting, 6.914e-06s analysis) +3 iterations (4 th.) took 0.004818s; avg 0.001606s ( +/- 1.11/ 1.48 %); best 0.001588s; worst 0.00163s; std dev. 1.755e-05 (taking best). +Reference operation time is 0.00158811 s (157.4 Mflops) with 4 threads. +After merge step 3: tpop: 0.001588 s ~Mflops: 157.420 nsubm:4 otn:4 +Applying merge (7 -> 4 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.069x: 0.001485s -> 0.001588s. +Merge (4 -> 3 leaves) took w.c.t. of 0.0003259s, ~0.000304s of computing time (of which 0s sorting, 6.914e-06s analysis) +3 iterations (4 th.) took 0.004754s; avg 0.001585s ( +/- 3.70/ 3.74 %); best 0.001526s; worst 0.001644s; std dev. 4.809e-05 (taking best). +Reference operation time is 0.00152612 s (163.8 Mflops) with 4 threads. +After merge step 4: tpop: 0.001526 s ~Mflops: 163.814 nsubm:3 otn:4 +Applying merge (4 -> 3 leaves, 4 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.028x: 0.001485s -> 0.001526s. +Merge (3 -> 2 leaves) took w.c.t. of 0.0003111s, ~0.000294s of computing time (of which 0s sorting, 5.007e-06s analysis) +3 iterations (4 th.) took 0.00574s; avg 0.001913s ( +/- 0.85/ 0.71 %); best 0.001897s; worst 0.001927s; std dev. 1.231e-05 (taking best). +Reference operation time is 0.0018971 s (131.8 Mflops) with 4 threads. +After merge step 5: tpop: 0.001897 s ~Mflops: 131.780 nsubm:2 otn:4 +Applying merge (3 -> 2 leaves, 4 th.) yielded SLOWDOWN (3th of 3 tolerable) of 1.277x: 0.001485s -> 0.001897s. +Skipping further merge based tests after 3 definite performance degradations in a row (and last exceeding limit). +A total of 5 merge steps (of max 6) (16 -> 2 subms) took 0.03852s (of which 0.004318s partitioning, 0s I/O); computing times: 0.004677s in par. loops, 0.00115s sorting, 3.672e-05s analyzing) +Total merge + benchmarking process took 0.03852s, equivalent to 25.9/24.3 new/old ops (0.01367s for 3 clones -- as 9.2/8.6 ops, or 3.1/2.9 ops per clone), SPEEDUP of 1.067x +Applying multi-merge (16 -> 7 leaves, 2 steps, 4 -> 4 th.sp.) yielded SPEEDUP of 1.067x (0.001584s -> 0.001485s), will amortize in 389.4 ops by saving 9.894e-05s per op. +In 1 tuning rounds (tot. 0.048s, 0.014s for constructor, 3 clones) obtained a SPEEDUP of 6.7% (1.067x) (from 157.8 to 168.3 Mflops). +After 0.048470s, autotuning routine declared speedup of 1.06662 x, when using threads count of 4. +(500 x 500)[0x128fc20]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 7, symflags:'' +After threads auto-tuning, 100 multiplications took 0.364694s -- further speedup of 0.585307 x librsb timer-based profiling is not supported in this build. If you wish to have it, re-configure librsb with its support. So you can safely ignore the error you might just have seen printed out on screen. /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve Hello, RSB! @@ -9752,19 +9776,19 @@ Correctly initialized the library. Building a matrix with 7 nnz, 6 x 6 Duplicates check: 1 - 0 = 1 - converted COO to RSB in 4.288e-03 s (100.00 %) - analyzed arrays in 3.080e-03 s (71.83 %) - cleaned-up arrays in 9.060e-06 s (0.21 %) - deduplicated arrays in 9.537e-07 s (0.02 %) - sorted arrays in 3.099e-06 s (0.07 %) - shuffled partitions in 1.140e-03 s (26.58 %) - memory allocations took 2.503e-05 s (0.58 %) - leafs setup took 7.153e-06 s (0.17 %) - halfword conversion took 1.001e-05 s (0.23 %) -Built (6 x 6)[0x2126250]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' + converted COO to RSB in 1.291e-02 s (100.00 %) + analyzed arrays in 9.075e-03 s (70.28 %) + cleaned-up arrays in 9.060e-06 s (0.07 %) + deduplicated arrays in 0.000e+00 s (0.00 %) + sorted arrays in 2.861e-06 s (0.02 %) + shuffled partitions in 3.770e-03 s (29.20 %) + memory allocations took 2.408e-05 s (0.19 %) + leafs setup took 4.053e-06 s (0.03 %) + halfword conversion took 9.060e-06 s (0.07 %) +Built (6 x 6)[0x1f00250]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0x2126250]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0x1f00250]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -9790,20 +9814,37 @@ 1 1 Will autotune matrix: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:9.766e-08 -3 iterations (4 th.) took 4.005e-05s; avg 1.335e-05s ( +/- 92.86/183.93 %); best 9.537e-07s; worst 3.791e-05s; std dev. 1.736e-05 (taking best). +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:8.96e-08 +3 iterations (4 th.) took 5.889e-05s; avg 1.963e-05s ( +/- 95.14/184.21 %); best 9.537e-07s; worst 5.579e-05s; std dev. 2.557e-05 (taking best). Reference operation time is 9.53674e-07 s (2.097 Mflops) with 4 threads. Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 9.537e-07 Mflops: 2.097) -Merge (1 -> 1 leaves) took w.c.t. of 1.192e-06s, ~0s of computing time (of which 0s sorting, 0s analysis) -3 iterations (4 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 89.76/100.00 %); best 9.766e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 9.76563e-08 s (20.48 Mflops) with 4 threads. -After merge step 1: tpop: 9.766e-08 s ~Mflops: 20.480 nsubm:1 otn:4 -Applying merge (1 -> 1 leaves, 4 th.) yielded SPEEDUP of 9.766x: 9.537e-07s -> 9.766e-08s, so taking this instance. +Merge (1 -> 1 leaves) took w.c.t. of 0s, ~0s of computing time (of which 0s sorting, 0s analysis) +3 iterations (4 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 29.41/ 58.82 %); best 9.537e-07s; worst 2.146e-06s; std dev. 5.62e-07 (taking best). +Reference operation time is 9.53674e-07 s (2.097 Mflops) with 4 threads. +After merge step 1: tpop: 9.537e-07 s ~Mflops: 2.097 nsubm:1 otn:4 +Applying merge (1 -> 1 leaves, 4 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 9.537e-07s -> 9.537e-07s, so IGNORING this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (1 -> 1 subms) took 0.003305s (of which 5.96e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) -Total merge + benchmarking process took 0.003305s, equivalent to 33842.8/3465.5 new/old ops (0.006617s for 2 clones -- as 67758.8/6938.5 ops, or 33879.4/3469.2 ops per clone), SPEEDUP of 9.766x -Applying multi-merge (1 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 9.766x (9.537e-07s -> 9.766e-08s), will amortize in 3860.9 ops by saving 8.56e-07s per op. -In 1 tuning rounds (tot. 0.0068s, 0.0066s for constructor, 2 clones) obtained a SPEEDUP of 876.6% (9.766x) (from 2.097 to 20.48 Mflops). +A total of 1 merge steps (of max 6) (1 -> 1 subms) took 2.718e-05s (of which 5.007e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 2.718e-05s, equivalent to 28.5/28.5 new/old ops (0.01104s for 1 clones -- as 11573.0/11573.0 ops, or 11573.0/11573.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (4 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 42.86/ 85.71 %); best 9.537e-07s; worst 3.099e-06s; std dev. 1.012e-06 (taking best). +Reference operation time is 9.53674e-07 s (2.097 Mflops) with 4 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 9.537e-07 Mflops: 2.097) +Split (1 -> 1 leaves, 1 -> 1 subms) took 2.48e-05s (of which: 3.099e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (4 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 91.33/107.69 %); best 8.96e-08s; worst 2.146e-06s; std dev. 8.778e-07 (taking best). +Reference operation time is 8.95977e-08 s (22.32 Mflops) with 4 threads. +After split step 1: tpop: 8.96e-08 s ~Mflops: 22.322 nsubm:1 otn:4 +Applying split (1 -> 1 leaves, 4 th.) yielded SPEEDUP of 10.644x: 9.537e-07s -> 8.96e-08s, so taking this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 2.813e-05s (of which: 2.861e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (4 th.) took 6.914e-06s; avg 2.305e-06s ( +/- 58.62/106.90 %); best 9.537e-07s; worst 4.768e-06s; std dev. 1.745e-06 (taking best). +Reference operation time is 9.53674e-07 s (2.097 Mflops) with 4 threads. +After split step 2: tpop: 9.537e-07 s ~Mflops: 2.097 nsubm:1 otn:4 +Applying split (1 -> 1 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 10.644x: 8.96e-08s -> 9.537e-07s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 2 split steps (of max 6) (1 -> 1 subms) took 0.01096s (of which 8.416e-05s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 5.96e-06s analyzing) +Total split + benchmarking process took 0.01096s, equivalent to 122325.7/11492.5 new/old ops (0.02241s for 2 clones -- as 250141.0/23500.8 ops, or 125070.5/11750.4 ops per clone), SPEEDUP of 10.644x +Applying multi-split (1 -> 1 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 10.644x (9.537e-07s -> 8.96e-08s), will amortize in 12684.2 ops by saving 8.641e-07s per op. +In 1 tuning rounds (tot. 0.034s, 0.033s for constructor, 3 clones) obtained a SPEEDUP of 964.4% (10.64x) (from 2.097 to 22.32 Mflops). Backsolving we should get a unitary vector: %%MatrixMarket matrix array real general @@ -9838,106 +9879,183 @@ /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran Building a matrix with 210 nnz, 20 x 20 Duplicates check: 210 - 0 = 210 - converted COO to RSB in 9.884e-03 s (100.00 %) - analyzed arrays in 3.476e-03 s (35.17 %) - cleaned-up arrays in 5.960e-06 s (0.06 %) - deduplicated arrays in 4.053e-06 s (0.04 %) - sorted arrays in 1.713e-03 s (17.33 %) - shuffled partitions in 2.366e-03 s (23.94 %) - memory allocations took 5.984e-05 s (0.61 %) - leafs setup took 9.060e-06 s (0.09 %) - halfword conversion took 2.228e-03 s (22.54 %) -Built (20 x 20)[0x1352160]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 10, symflags:'LS' + converted COO to RSB in 2.582e-02 s (100.00 %) + analyzed arrays in 7.699e-03 s (29.81 %) + cleaned-up arrays in 5.960e-06 s (0.02 %) + deduplicated arrays in 2.861e-06 s (0.01 %) + sorted arrays in 4.855e-03 s (18.80 %) + shuffled partitions in 6.795e-03 s (26.31 %) + memory allocations took 5.603e-05 s (0.22 %) + leafs setup took 8.106e-06 s (0.03 %) + halfword conversion took 6.380e-03 s (24.71 %) +Built (20 x 20)[0x151f160]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 10, symflags:'LS' Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:1.04e-07 -Starting autotuning (16 x 1.03998e-07 s stages, transA=N, nrhs=1, timer gran.=1.03998e-07), 4 suggested as starting thread count(default). -3 iterations (4 th.) took 0.01609s; avg 0.005363s ( +/- 80.24/147.51 %); best 0.00106s; worst 0.01328s; std dev. 0.005602 (taking best). -Reference operation time is 0.00106001 s (0.7924 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz (tpop: 0.00106 Mflops: 0.792) -Merge (10 -> 8 leaves) took w.c.t. of 6.294e-05s, ~1.693e-05s of computing time (of which 3.099e-06s sorting, 1.192e-05s analysis) -3 iterations (4 th.) took 0.0376s; avg 0.01253s ( +/- 90.27/173.21 %); best 0.00122s; worst 0.03424s; std dev. 0.01535 (taking best). -Reference operation time is 0.00121999 s (0.6885 Mflops) with 4 threads. -After merge step 1: tpop: 0.00122 s ~Mflops: 0.689 nsubm:8 otn:4 -Applying merge (10 -> 8 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.151x: 0.00106s -> 0.00122s. -Merge (8 -> 6 leaves) took w.c.t. of 4.196e-05s, ~1.287e-05s of computing time (of which 2.146e-06s sorting, 1.192e-05s analysis) -3 iterations (4 th.) took 0.003618s; avg 0.001206s ( +/- 52.32/ 30.83 %); best 0.0005751s; worst 0.001578s; std dev. 0.0004485 (taking best). -Reference operation time is 0.000575066 s (1.461 Mflops) with 4 threads. -After merge step 2: tpop: 0.0005751 s ~Mflops: 1.461 nsubm:6 otn:4 -Applying merge (8 -> 6 leaves, 4 th.) yielded SPEEDUP of 1.843x: 0.00106s -> 0.0005751s, so taking this instance. -Merge (6 -> 3 leaves) took w.c.t. of 3.719e-05s, ~1.216e-05s of computing time (of which 4.053e-06s sorting, 5.007e-06s analysis) -3 iterations (4 th.) took 0.007143s; avg 0.002381s ( +/- 57.78/113.94 %); best 0.001005s; worst 0.005094s; std dev. 0.001918 (taking best). -Reference operation time is 0.00100517 s (0.8357 Mflops) with 4 threads. -After merge step 3: tpop: 0.001005 s ~Mflops: 0.836 nsubm:3 otn:4 -Applying merge (6 -> 3 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.748x: 0.0005751s -> 0.001005s. +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:9.005e-08 +Starting autotuning (16 x 9.00507e-08 s stages, transA=N, nrhs=1, timer gran.=9.00507e-08), 4 suggested as starting thread count(default). +3 iterations (4 th.) took 0.00911s; avg 0.003037s ( +/- 20.97/ 38.44 %); best 0.0024s; worst 0.004204s; std dev. 0.0008266 (taking best). +Reference operation time is 0.00239992 s (0.35 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz (tpop: 0.0024 Mflops: 0.350) +Merge (10 -> 8 leaves) took w.c.t. of 4.888e-05s, ~1.407e-05s of computing time (of which 2.146e-06s sorting, 6.914e-06s analysis) +3 iterations (4 th.) took 0.01237s; avg 0.004123s ( +/- 12.45/ 21.33 %); best 0.00361s; worst 0.005003s; std dev. 0.0006249 (taking best). +Reference operation time is 0.0036099 s (0.2327 Mflops) with 4 threads. +After merge step 1: tpop: 0.00361 s ~Mflops: 0.233 nsubm:8 otn:4 +Applying merge (10 -> 8 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.504x: 0.0024s -> 0.00361s. Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 3 merge steps (of max 6) (10 -> 3 subms) took 0.05133s (of which 0.0001643s partitioning, 0s I/O); computing times: 4.196e-05s in par. loops, 9.298e-06s sorting, 2.885e-05s analyzing) -Total merge + benchmarking process took 0.05133s, equivalent to 89.3/48.4 new/old ops (0.006113s for 2 clones -- as 10.6/5.8 ops, or 5.3/2.9 ops per clone), SPEEDUP of 1.843x -Applying multi-merge (10 -> 6 leaves, 2 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1.843x (0.00106s -> 0.0005751s), will amortize in 105.8 ops by saving 0.0004849s per op. -In 1 tuning rounds (tot. 0.071s, 0.0061s for constructor, 2 clones) obtained a SPEEDUP of 84.3% (1.843x) (from 0.7924 to 1.461 Mflops). +A total of 1 merge steps (of max 6) (10 -> 8 subms) took 0.01245s (of which 5.484e-05s partitioning, 0s I/O); computing times: 1.407e-05s in par. loops, 2.146e-06s sorting, 6.914e-06s analyzing) +Total merge + benchmarking process took 0.01245s, equivalent to 5.2/5.2 new/old ops (0.01184s for 1 clones -- as 4.9/4.9 ops, or 4.9/4.9 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (4 th.) took 0.009897s; avg 0.003299s ( +/- 27.01/ 49.90 %); best 0.002408s; worst 0.004945s; std dev. 0.001165 (taking best). +Reference operation time is 0.00240803 s (0.3488 Mflops) with 4 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz (tpop: 0.002408 Mflops: 0.349) +Split (10 -> 25 leaves, 14 -> 34 subms) took 0.005317s (of which: 5.96e-06s analysis, -8.553e+09s mem.mgmt); compute time: 0.0001352s overall, 5.007e-06s searches, 0.0001302s shuffle, 0.0001011s switch, 3.099e-06s quadrants. +3 iterations (4 th.) took 0.01225s; avg 0.004084s ( +/- 37.66/ 21.30 %); best 0.002546s; worst 0.004954s; std dev. 0.001091 (taking best). +Reference operation time is 0.00254607 s (0.3299 Mflops) with 4 threads. +After split step 1: tpop: 0.002546 s ~Mflops: 0.330 nsubm:25 otn:4 +Applying split (10 -> 25 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.057x: 0.002408s -> 0.002546s. +Split (25 -> 57 leaves, 34 -> 78 subms) took 0.004712s (of which: 9.06e-06s analysis, -2.053e+10s mem.mgmt); compute time: 6.914e-05s overall, 6.914e-06s searches, 6.223e-05s shuffle, 1.287e-05s switch, 5.007e-06s quadrants. +3 iterations (4 th.) took 0.009733s; avg 0.003244s ( +/- 27.47/ 50.67 %); best 0.002353s; worst 0.004888s; std dev. 0.001164 (taking best). +Reference operation time is 0.00235295 s (0.357 Mflops) with 4 threads. +After split step 2: tpop: 0.002353 s ~Mflops: 0.357 nsubm:57 otn:4 +Applying split (25 -> 57 leaves, 4 th.) yielded SPEEDUP of 1.023x: 0.002408s -> 0.002353s, so taking this instance. +Split (57 -> 137 leaves, 78 -> 186 subms) took 0.004625s (of which: 1.407e-05s analysis, -4.79e+10s mem.mgmt); compute time: 0.0001543s overall, 1.645e-05s searches, 0.0001378s shuffle, 3.29e-05s switch, 1.836e-05s quadrants. +3 iterations (4 th.) took 0.009663s; avg 0.003221s ( +/- 24.94/ 42.51 %); best 0.002418s; worst 0.00459s; std dev. 0.0009729 (taking best). +Reference operation time is 0.0024178 s (0.3474 Mflops) with 4 threads. +After split step 3: tpop: 0.002418 s ~Mflops: 0.347 nsubm:137 otn:4 +Applying split (57 -> 137 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.028x: 0.002353s -> 0.002418s. +Split (137 -> 146 leaves, 186 -> 198 subms) took 0.005168s (of which: 2.694e-05s analysis, -5.132e+09s mem.mgmt); compute time: 9.108e-05s overall, 1.907e-06s searches, 8.917e-05s shuffle, 7.415e-05s switch, 4.053e-06s quadrants. +3 iterations (4 th.) took 0.01059s; avg 0.003531s ( +/- 40.03/ 39.27 %); best 0.002118s; worst 0.004918s; std dev. 0.001143 (taking best). +Reference operation time is 0.00211787 s (0.3966 Mflops) with 4 threads. +After split step 4: tpop: 0.002118 s ~Mflops: 0.397 nsubm:146 otn:4 +Applying split (137 -> 146 leaves, 4 th.) yielded SPEEDUP of 1.111x: 0.002353s -> 0.002118s, so taking this instance. +Split (146 -> 146 leaves, 198 -> 198 subms) took 0.006953s (of which: 2.813e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (4 th.) took 0.009416s; avg 0.003139s ( +/- 22.77/ 23.27 %); best 0.002424s; worst 0.003869s; std dev. 0.00059 (taking best). +Reference operation time is 0.002424 s (0.3465 Mflops) with 4 threads. +After split step 5: tpop: 0.002424 s ~Mflops: 0.347 nsubm:146 otn:4 +Applying split (146 -> 146 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.145x: 0.002118s -> 0.002424s. +Split (146 -> 146 leaves, 198 -> 198 subms) took 0.00662s (of which: 2.599e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (4 th.) took 0.0096s; avg 0.0032s ( +/- 30.37/ 51.78 %); best 0.002228s; worst 0.004857s; std dev. 0.001178 (taking best). +Reference operation time is 0.00222802 s (0.377 Mflops) with 4 threads. +After split step 6: tpop: 0.002228 s ~Mflops: 0.377 nsubm:146 otn:4 +Applying split (146 -> 146 leaves, 4 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.052x: 0.002118s -> 0.002228s. +A total of 6 split steps (of max 6) (10 -> 146 subms) took 0.119s (of which 0.03432s partitioning, 0s I/O); computing times: 0.0004497s in par. loops, 3.028e-05s sorting, 0.0001101s analyzing) +Total split + benchmarking process took 0.119s, equivalent to 56.2/49.4 new/old ops (0.03372s for 3 clones -- as 15.9/14.0 ops, or 5.3/4.7 ops per clone), SPEEDUP of 1.137x +Applying multi-split (10 -> 146 leaves, 4 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1.137x (0.002408s -> 0.002118s), will amortize in 410.2 ops by saving 0.0002902s per op. +In 1 tuning rounds (tot. 0.17s, 0.046s for constructor, 4 clones) obtained a SPEEDUP of 13.7% (1.137x) (from 0.3488 to 0.3966 Mflops). autotuner chose 4 threads -Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 8 subms, 6 lsubms, 2.8762 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:1.04e-07 -Starting autotuning (16 x 1.03998e-07 s stages, transA=N, nrhs=1, timer gran.=1.03998e-07), 4 suggested as starting thread count(default). -3 iterations (4 th.) took 0.01979s; avg 0.006597s ( +/- 84.28/145.08 %); best 0.001037s; worst 0.01617s; std dev. 0.006797 (taking best). -~ 4 threads: 0.001037s (0.81 Mflops) (0/2 degradations so far) - -3 iterations (3 th.) took 0.03225s; avg 0.01075s ( +/- 94.73/179.91 %); best 0.000567s; worst 0.03009s; std dev. 0.01368 (taking best). - 3 threads: 0.000567s (1.5 Mflops) (0/2 degradations so far) - -3 iterations (2 th.) took 0.006412s; avg 0.002137s ( +/- 51.48/ 87.01 %); best 0.001037s; worst 0.003997s; std dev. 0.001322 (taking best). - 2 threads: 0.001037s (0.81 Mflops) (1/2 degradations so far) - -3 iterations (1 th.) took 0.003771s; avg 0.001257s ( +/- 58.48/ 30.31 %); best 0.0005219s; worst 0.001638s; std dev. 0.0005199 (taking best). - 1 threads: 0.0005219s (1.6 Mflops) (0/2 degradations so far) - -Best threads choice is 1; starting threads were 4; max speed gap is 2x; search took 0.062s. -Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 8 subms, 6 lsubms, 2.8762 bpnz (tpop: 0.0005219 Mflops: 1.610) -Merge (6 -> 3 leaves) took w.c.t. of 3.695e-05s, ~1.502e-05s of computing time (of which 5.007e-06s sorting, 1.001e-05s analysis) -3 iterations (4 th.) took 0.04273s; avg 0.01424s ( +/- 96.05/188.73 %); best 0.0005629s; worst 0.04113s; std dev. 0.01901 (taking best). -~ 4 threads: 0.0005629s (1.5 Mflops) (0/2 degradations so far) - -3 iterations (3 th.) took 0.05034s; avg 0.01678s ( +/- 90.58/121.48 %); best 0.00158s; worst 0.03717s; std dev. 0.01498 (taking best). - 3 threads: 0.00158s (0.53 Mflops) (1/2 degradations so far) - -3 iterations (2 th.) took 0.00379s; avg 0.001263s ( +/- 15.85/ 24.19 %); best 0.001063s; worst 0.001569s; std dev. 0.0002196 (taking best). - 2 threads: 0.001063s (0.79 Mflops) (2/2 degradations so far) - -Best threads choice is 4; starting threads were 4; max speed gap is 2.8x; search took 0.097s. -After merge step 1: tpop: 0.0005629 s ~Mflops: 1.492 nsubm:3 otn:4 -Applying merge (6 -> 3 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.079x: 0.0005219s -> 0.0005629s. -Merge (3 -> 1 leaves) took w.c.t. of 4.578e-05s, ~1.907e-05s of computing time (of which 5.007e-06s sorting, 1.001e-05s analysis) -3 iterations (4 th.) took 8.106e-06s; avg 2.702e-06s ( +/- 64.71/ 85.29 %); best 9.537e-07s; worst 5.007e-06s; std dev. 1.701e-06 (taking best). -~ 4 threads: 9.537e-07s (8.8e+02 Mflops) (0/2 degradations so far) - -3 iterations (3 th.) took 5.96e-06s; avg 1.987e-06s ( +/- 4.00/ 8.00 %); best 1.907e-06s; worst 2.146e-06s; std dev. 1.124e-07 (taking best). - 3 threads: 1.907e-06s (4.4e+02 Mflops) (1/2 degradations so far) - -3 iterations (2 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 42.86/ 28.57 %); best 9.537e-07s; worst 2.146e-06s; std dev. 5.15e-07 (taking best). - 2 threads: 9.537e-07s (8.8e+02 Mflops) (0/2 degradations so far) - -3 iterations (1 th.) took 5.96e-06s; avg 1.987e-06s ( +/- 4.00/ 8.00 %); best 1.907e-06s; worst 2.146e-06s; std dev. 1.124e-07 (taking best). - 1 threads: 1.907e-06s (4.4e+02 Mflops) (1/2 degradations so far) - -Best threads choice is 4; starting threads were 4; max speed gap is 2x; search took 6.7e-05s. -After merge step 2: tpop: 9.537e-07 s ~Mflops: 880.804 nsubm:1 otn:4 -Applying merge (3 -> 1 leaves, 4 th.) yielded SPEEDUP of 547.250x: 0.0005219s -> 9.537e-07s, so taking this instance. -Merged all the matrix leaves: no reason to continue merging. -A total of 2 merge steps (of max 6) (6 -> 1 subms) took 0.1004s (of which 9.704e-05s partitioning, 0s I/O); computing times: 3.409e-05s in par. loops, 1.001e-05s sorting, 2.003e-05s analyzing) -Total merge + benchmarking process took 0.1004s, equivalent to 105271.8/192.4 new/old ops (0.00593s for 2 clones -- as 6218.0/11.4 ops, or 3109.0/5.7 ops per clone), SPEEDUP of 547.250x -Applying multi-merge (6 -> 1 leaves, 2 steps, 1 -> 4 th.sp.) yielded SPEEDUP of 547.250x (0.0005219s -> 9.537e-07s), will amortize in 192.7 ops by saving 0.0005209s per op. -In 1 tuning rounds (tot. 0.17s, 0.0059s for constructor, 2 clones) obtained a SPEEDUP of 54625.0% (547.2x) (from 1.61 to 880.8 Mflops). +Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 198 subms, 146 lsubms, 4.2286 bpnz. +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:9.005e-08 +Starting autotuning (16 x 9.00507e-08 s stages, transA=N, nrhs=1, timer gran.=9.00507e-08), 4 suggested as starting thread count(default). +3 iterations (4 th.) took 0.01014s; avg 0.003381s ( +/- 26.51/ 51.92 %); best 0.002485s; worst 0.005137s; std dev. 0.001242 (taking best). +~ 4 threads: 0.002485s (0.34 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.01197s; avg 0.00399s ( +/- 44.11/ 22.47 %); best 0.00223s; worst 0.004886s; std dev. 0.001244 (taking best). + 3 threads: 0.00223s (0.38 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 0.01002s; avg 0.00334s ( +/- 33.59/ 41.64 %); best 0.002218s; worst 0.004731s; std dev. 0.001043 (taking best). + 2 threads: 0.002218s (0.38 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 0.009566s; avg 0.003189s ( +/- 27.15/ 51.91 %); best 0.002323s; worst 0.004844s; std dev. 0.001171 (taking best). + 1 threads: 0.002323s (0.36 Mflops) (1/2 degradations so far) - +Best threads choice is 2; starting threads were 4; max speed gap is 1.1x; search took 0.042s. +Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 198 subms, 146 lsubms, 4.2286 bpnz (tpop: 0.002218 Mflops: 0.379) +Merge (146 -> 99 leaves) took w.c.t. of 0.003722s, ~0.0001495s of computing time (of which 1.335e-05s sorting, 2.193e-05s analysis) +3 iterations (4 th.) took 0.01191s; avg 0.00397s ( +/- 34.56/ 25.66 %); best 0.002598s; worst 0.004989s; std dev. 0.001008 (taking best). +~ 4 threads: 0.002598s (0.32 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.09282s; avg 0.03094s ( +/- 60.21/ 93.57 %); best 0.01231s; worst 0.05989s; std dev. 0.02075 (taking best). + 3 threads: 0.01231s (0.068 Mflops) (1/2 degradations so far) - +3 iterations (2 th.) took 0.01204s; avg 0.004015s ( +/- 11.99/ 12.49 %); best 0.003533s; worst 0.004516s; std dev. 0.0004015 (taking best). + 2 threads: 0.003533s (0.24 Mflops) (2/2 degradations so far) - +Best threads choice is 4; starting threads were 4; max speed gap is 4.7x; search took 0.12s. +After merge step 1: tpop: 0.002598 s ~Mflops: 0.323 nsubm:99 otn:4 +Applying merge (146 -> 99 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.171x: 0.002218s -> 0.002598s. +Merge (99 -> 68 leaves) took w.c.t. of 0.003379s, ~6.008e-05s of computing time (of which 8.821e-06s sorting, 2.408e-05s analysis) +3 iterations (4 th.) took 0.01143s; avg 0.003811s ( +/- 26.27/ 21.32 %); best 0.00281s; worst 0.004624s; std dev. 0.0007524 (taking best). +~ 4 threads: 0.00281s (0.3 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.01249s; avg 0.004162s ( +/- 31.52/ 23.22 %); best 0.00285s; worst 0.005128s; std dev. 0.0009617 (taking best). + 3 threads: 0.00285s (0.29 Mflops) (1/2 degradations so far) - +3 iterations (2 th.) took 0.01267s; avg 0.004223s ( +/- 21.59/ 10.96 %); best 0.003311s; worst 0.004686s; std dev. 0.0006448 (taking best). + 2 threads: 0.003311s (0.25 Mflops) (2/2 degradations so far) - +Best threads choice is 4; starting threads were 4; max speed gap is 1.2x; search took 0.037s. +After merge step 2: tpop: 0.00281 s ~Mflops: 0.299 nsubm:68 otn:4 +Applying merge (99 -> 68 leaves, 4 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.267x: 0.002218s -> 0.00281s. +Skipping further merge based tests after 2 definite performance degradations in a row (and last exceeding limit). +A total of 2 merge steps (of max 6) (146 -> 68 subms) took 0.1606s (of which 0.007121s partitioning, 0s I/O); computing times: 0.0002096s in par. loops, 2.217e-05s sorting, 4.601e-05s analyzing) +Total merge + benchmarking process took 0.1606s, equivalent to 72.4/72.4 new/old ops (0.01176s for 1 clones -- as 5.3/5.3 ops, or 5.3/5.3 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (4 th.) took 0.01112s; avg 0.003706s ( +/- 42.22/ 31.31 %); best 0.002141s; worst 0.004866s; std dev. 0.001149 (taking best). +~ 4 threads: 0.002141s (0.39 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.0106s; avg 0.003534s ( +/- 29.74/ 44.64 %); best 0.002483s; worst 0.005112s; std dev. 0.001136 (taking best). + 3 threads: 0.002483s (0.34 Mflops) (1/2 degradations so far) - +3 iterations (2 th.) took 0.01151s; avg 0.003837s ( +/- 40.68/ 60.93 %); best 0.002276s; worst 0.006175s; std dev. 0.001684 (taking best). + 2 threads: 0.002276s (0.37 Mflops) (2/2 degradations so far) - +Best threads choice is 4; starting threads were 4; max speed gap is 1.2x; search took 0.034s. +Starting split (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 198 subms, 146 lsubms, 4.2286 bpnz (tpop: 0.002141 Mflops: 0.392) +Split (146 -> 146 leaves, 198 -> 198 subms) took 0.006095s (of which: 2.909e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (4 th.) took 0.009575s; avg 0.003192s ( +/- 28.97/ 52.08 %); best 0.002267s; worst 0.004854s; std dev. 0.001178 (taking best). +~ 4 threads: 0.002267s (0.37 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.01295s; avg 0.004316s ( +/- 14.09/ 13.57 %); best 0.003708s; worst 0.004902s; std dev. 0.0004876 (taking best). + 3 threads: 0.003708s (0.23 Mflops) (1/2 degradations so far) - +3 iterations (2 th.) took 0.009536s; avg 0.003179s ( +/- 22.36/ 42.95 %); best 0.002468s; worst 0.004544s; std dev. 0.0009657 (taking best). + 2 threads: 0.002468s (0.34 Mflops) (2/2 degradations so far) - +Best threads choice is 4; starting threads were 4; max speed gap is 1.6x; search took 0.032s. +After split step 1: tpop: 0.002267 s ~Mflops: 0.371 nsubm:146 otn:4 +Applying split (146 -> 146 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.059x: 0.002141s -> 0.002267s. +Split (146 -> 146 leaves, 198 -> 198 subms) took 0.004375s (of which: 4.601e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (4 th.) took 0.01158s; avg 0.003861s ( +/- 34.95/ 23.71 %); best 0.002512s; worst 0.004777s; std dev. 0.0009742 (taking best). +~ 4 threads: 0.002512s (0.33 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.01158s; avg 0.00386s ( +/- 39.66/ 30.14 %); best 0.002329s; worst 0.005023s; std dev. 0.00113 (taking best). + 3 threads: 0.002329s (0.36 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 0.01012s; avg 0.003372s ( +/- 13.05/ 24.49 %); best 0.002932s; worst 0.004198s; std dev. 0.0005843 (taking best). + 2 threads: 0.002932s (0.29 Mflops) (1/2 degradations so far) - +3 iterations (1 th.) took 0.01117s; avg 0.003725s ( +/- 40.83/ 44.39 %); best 0.002204s; worst 0.005378s; std dev. 0.001299 (taking best). + 1 threads: 0.002204s (0.38 Mflops) (0/2 degradations so far) - +Best threads choice is 1; starting threads were 4; max speed gap is 1.3x; search took 0.045s. +After split step 2: tpop: 0.002204 s ~Mflops: 0.381 nsubm:146 otn:1 +Applying split (146 -> 146 leaves, 1 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.029x: 0.002141s -> 0.002204s. +Split (146 -> 146 leaves, 198 -> 198 subms) took 0.00473s (of which: 3.004e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (4 th.) took 0.009247s; avg 0.003082s ( +/- 27.30/ 47.36 %); best 0.002241s; worst 0.004542s; std dev. 0.001036 (taking best). +~ 4 threads: 0.002241s (0.37 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.01573s; avg 0.005244s ( +/- 53.81/ 58.31 %); best 0.002422s; worst 0.008301s; std dev. 0.002406 (taking best). + 3 threads: 0.002422s (0.35 Mflops) (1/2 degradations so far) - +3 iterations (2 th.) took 0.0109s; avg 0.003633s ( +/- 37.39/ 35.61 %); best 0.002275s; worst 0.004927s; std dev. 0.001084 (taking best). + 2 threads: 0.002275s (0.37 Mflops) (2/2 degradations so far) - +Best threads choice is 4; starting threads were 4; max speed gap is 1.1x; search took 0.036s. +After split step 3: tpop: 0.002241 s ~Mflops: 0.375 nsubm:146 otn:4 +Applying split (146 -> 146 leaves, 4 th.) yielded SLOWDOWN (3th of 3 tolerable) of 1.047x: 0.002141s -> 0.002241s. +Split (146 -> 146 leaves, 198 -> 198 subms) took 0.00522s (of which: 2.909e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (4 th.) took 0.01042s; avg 0.003474s ( +/- 34.72/ 62.78 %); best 0.002268s; worst 0.005655s; std dev. 0.001545 (taking best). +~ 4 threads: 0.002268s (0.37 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.01101s; avg 0.003671s ( +/- 29.55/ 30.19 %); best 0.002586s; worst 0.004779s; std dev. 0.0008953 (taking best). + 3 threads: 0.002586s (0.32 Mflops) (1/2 degradations so far) - +3 iterations (2 th.) took 0.01007s; avg 0.003358s ( +/- 31.42/ 39.19 %); best 0.002303s; worst 0.004674s; std dev. 0.0009854 (taking best). + 2 threads: 0.002303s (0.36 Mflops) (2/2 degradations so far) - +Best threads choice is 4; starting threads were 4; max speed gap is 1.1x; search took 0.032s. +After split step 4: tpop: 0.002268 s ~Mflops: 0.370 nsubm:146 otn:4 +Applying split (146 -> 146 leaves, 4 th.) yielded SLOWDOWN (4th of 3 tolerable) of 1.059x: 0.002141s -> 0.002268s. +Skipping further split based tests after 4 definite performance degradations in a row. +A total of 4 split steps (of max 6) (146 -> 146 subms) took 0.1654s (of which 0.02088s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0.0001342s analyzing) +Total split + benchmarking process took 0.1654s, equivalent to 77.3/77.3 new/old ops (0.01034s for 1 clones -- as 4.8/4.8 ops, or 4.8/4.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.42s, 0.022s for constructor, 2 clones) obtained NO speedup (best stays 0.3923 Mflops). check results are ok Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 3.313e-03 s (100.00 %) - analyzed arrays in 1.119e-03 s (33.77 %) - cleaned-up arrays in 1.907e-06 s (0.06 %) - deduplicated arrays in 9.537e-07 s (0.03 %) - sorted arrays in 1.085e-03 s (32.75 %) - shuffled partitions in 1.082e-03 s (32.66 %) - memory allocations took 1.025e-05 s (0.31 %) - leafs setup took 4.053e-06 s (0.12 %) - halfword conversion took 6.914e-06 s (0.21 %) -Built (6 x 6)[0x1356db0]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' + converted COO to RSB in 1.148e-02 s (100.00 %) + analyzed arrays in 6.622e-03 s (57.68 %) + cleaned-up arrays in 2.146e-06 s (0.02 %) + deduplicated arrays in 9.537e-07 s (0.01 %) + sorted arrays in 2.117e-03 s (18.44 %) + shuffled partitions in 2.722e-03 s (23.71 %) + memory allocations took 9.775e-06 s (0.09 %) + leafs setup took 2.146e-06 s (0.02 %) + halfword conversion took 2.861e-06 s (0.02 %) +Built (6 x 6)[0x1523520]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' Read matrix pd.mtx 6 x 6 : 36 Matrix has no symmetry Using NRHS=4 -Repeated USMV took 0.4888E-04 s -A single USMM took 0.3386E-04 s -USMM-to-USMV speed ratio is is 1.444 x +Repeated USMV took 0.6104E-04 s +A single USMM took 0.8893E-04 s +USMM-to-USMV speed ratio is is 0.6863 x Call auto-tuning routine.. Repeat measurement. -Tuned USMM took 0.1192E-04 s -Tuned-to-untuned speed ratio is is 2.840 x +Tuned USMM took 0.1001E-04 s +Tuned-to-untuned speed ratio is is 8.881 x FAILED: 0 PASSED: 2 /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran_rsb_fi @@ -9986,249 +10104,223 @@ Loading matrix from file "/build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx". Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 8.690e-03 s (100.00 %) - analyzed arrays in 2.685e-03 s (30.90 %) - cleaned-up arrays in 3.099e-06 s (0.04 %) - deduplicated arrays in 1.907e-06 s (0.02 %) - sorted arrays in 1.481e-03 s (17.04 %) - shuffled partitions in 2.198e-03 s (25.29 %) - memory allocations took 2.193e-05 s (0.25 %) - leafs setup took 9.060e-06 s (0.10 %) - halfword conversion took 2.271e-03 s (26.13 %) -Built (6 x 6)[0x22f96a0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + converted COO to RSB in 2.582e-02 s (100.00 %) + analyzed arrays in 8.659e-03 s (33.53 %) + cleaned-up arrays in 3.099e-06 s (0.01 %) + deduplicated arrays in 2.146e-06 s (0.01 %) + sorted arrays in 4.466e-03 s (17.29 %) + shuffled partitions in 7.025e-03 s (27.21 %) + memory allocations took 2.098e-05 s (0.08 %) + leafs setup took 8.106e-06 s (0.03 %) + halfword conversion took 5.615e-03 s (21.74 %) +Built (6 x 6)[0x227c6a0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Considering D clone. Base matrix: -(6 x 6)[0x22fba30]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(6 x 6)[0x227ea30]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (4 th.) took 0.01035s; avg 0.003451s ( +/- 68.94/136.23 %); best 0.001072s; worst 0.008153s; std dev. 0.003325 (taking best). -Reference operation time is 0.00107193 s (0.1343 Mflops) with 4 threads. -After 0.010442s, autotuning routine did not find a better threads count configuration. +3 iterations (4 th.) took 0.009956s; avg 0.003319s ( +/- 27.23/ 46.20 %); best 0.002415s; worst 0.004852s; std dev. 0.00109 (taking best). +Reference operation time is 0.00241494 s (0.05963 Mflops) with 4 threads. +After 0.010034s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (4 th.) took 0.002759s; avg 0.0009197s ( +/- 39.78/ 20.16 %); best 0.0005538s; worst 0.001105s; std dev. 0.0002587 (taking best). -Reference operation time is 0.000553846 s (0.26 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.0005538 Mflops: 0.260) -Merge (16 -> 10 leaves) took w.c.t. of 0.0007081s, ~0.0001159s of computing time (of which 3.099e-06s sorting, 1.001e-05s analysis) -3 iterations (4 th.) took 0.05239s; avg 0.01746s ( +/- 93.92/111.81 %); best 0.001062s; worst 0.03699s; std dev. 0.01483 (taking best). -Reference operation time is 0.00106215 s (0.1356 Mflops) with 4 threads. -After merge step 1: tpop: 0.001062 s ~Mflops: 0.136 nsubm:10 otn:4 -Applying merge (16 -> 10 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.918x: 0.0005538s -> 0.001062s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (16 -> 10 subms) took 0.05314s (of which 0.0007179s partitioning, 0s I/O); computing times: 0.0001159s in par. loops, 3.099e-06s sorting, 1.001e-05s analyzing) -Total merge + benchmarking process took 0.05314s, equivalent to 96.0/96.0 new/old ops (0.003302s for 1 clones -- as 6.0/6.0 ops, or 6.0/6.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (4 th.) took 0.004547s; avg 0.001516s ( +/- 21.68/ 13.14 %); best 0.001187s; worst 0.001715s; std dev. 0.0002341 (taking best). -Reference operation time is 0.00118709 s (0.1213 Mflops) with 4 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.001187 Mflops: 0.121) -Split (16 -> 28 leaves, 21 -> 37 subms) took 0.001631s (of which: 6.914e-06s analysis, -6.842e+09s mem.mgmt); compute time: 0.0003128s overall, 6.199e-06s searches, 0.0003066s shuffle, 0.0001688s switch, 7.868e-06s quadrants. -3 iterations (4 th.) took 0.00902s; avg 0.003007s ( +/- 62.62/ 84.59 %); best 0.001124s; worst 0.00555s; std dev. 0.001866 (taking best). -Reference operation time is 0.00112391 s (0.1281 Mflops) with 4 threads. -After split step 1: tpop: 0.001124 s ~Mflops: 0.128 nsubm:28 otn:4 -Applying split (16 -> 28 leaves, 4 th.) yielded SPEEDUP of 1.056x: 0.001187s -> 0.001124s, so taking this instance. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001191s (of which: 7.868e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.01846s; avg 0.006153s ( +/- 85.50/160.05 %); best 0.0008922s; worst 0.016s; std dev. 0.006969 (taking best). -Reference operation time is 0.000892162 s (0.1614 Mflops) with 4 threads. -After split step 2: tpop: 0.0008922 s ~Mflops: 0.161 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SPEEDUP of 1.260x: 0.001124s -> 0.0008922s, so taking this instance. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001543s (of which: 9.06e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.00363s; avg 0.00121s ( +/- 47.53/ 59.09 %); best 0.0006349s; worst 0.001925s; std dev. 0.0005359 (taking best). -Reference operation time is 0.000634909 s (0.2268 Mflops) with 4 threads. -After split step 3: tpop: 0.0006349 s ~Mflops: 0.227 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SPEEDUP of 1.405x: 0.0008922s -> 0.0006349s, so taking this instance. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001578s (of which: 7.868e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.003395s; avg 0.001132s ( +/- 1.83/ 2.49 %); best 0.001111s; worst 0.00116s; std dev. 2.066e-05 (taking best). -Reference operation time is 0.00111103 s (0.1296 Mflops) with 4 threads. -After split step 4: tpop: 0.001111 s ~Mflops: 0.130 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.750x: 0.0006349s -> 0.001111s. -Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 4 split steps (of max 6) (16 -> 28 subms) took 0.05106s (of which 0.006187s partitioning, 0s I/O); computing times: 0.0003128s in par. loops, 6.199e-06s sorting, 3.171e-05s analyzing) -Total split + benchmarking process took 0.05106s, equivalent to 80.4/43.0 new/old ops (0.01277s for 4 clones -- as 20.1/10.8 ops, or 5.0/2.7 ops per clone), SPEEDUP of 1.870x -Applying multi-split (16 -> 28 leaves, 3 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1.870x (0.001187s -> 0.0006349s), will amortize in 92.5 ops by saving 0.0005522s per op. -In 1 tuning rounds (tot. 0.12s, 0.016s for constructor, 5 clones) obtained a SPEEDUP of 87.0% (1.87x) (from 0.1213 to 0.2268 Mflops). -After 0.118099s, global autotuning declared speedup of 1.8697 x, when using threads count of 4 and a new matrix: -(6 x 6)[0x230de58]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' +3 iterations (4 th.) took 0.01124s; avg 0.003746s ( +/- 31.62/ 25.49 %); best 0.002562s; worst 0.004701s; std dev. 0.0008884 (taking best). +Reference operation time is 0.00256181 s (0.05621 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.002562 Mflops: 0.056) +Merge (16 -> 10 leaves) took w.c.t. of 0.001395s, ~0.000103s of computing time (of which 1.907e-06s sorting, 8.106e-06s analysis) +3 iterations (4 th.) took 0.01006s; avg 0.003354s ( +/- 27.46/ 27.85 %); best 0.002433s; worst 0.004288s; std dev. 0.0007573 (taking best). +Reference operation time is 0.00243306 s (0.05918 Mflops) with 4 threads. +After merge step 1: tpop: 0.002433 s ~Mflops: 0.059 nsubm:10 otn:4 +Applying merge (16 -> 10 leaves, 4 th.) yielded SPEEDUP of 1.053x: 0.002562s -> 0.002433s, so taking this instance. +Merge (10 -> 7 leaves) took w.c.t. of 2.193e-05s, ~6.914e-06s of computing time (of which 9.537e-07s sorting, 5.96e-06s analysis) +3 iterations (4 th.) took 0.008903s; avg 0.002968s ( +/- 25.90/ 23.40 %); best 0.002199s; worst 0.003662s; std dev. 0.0005996 (taking best). +Reference operation time is 0.00219893 s (0.06549 Mflops) with 4 threads. +After merge step 2: tpop: 0.002199 s ~Mflops: 0.065 nsubm:7 otn:4 +Applying merge (10 -> 7 leaves, 4 th.) yielded SPEEDUP of 1.106x: 0.002433s -> 0.002199s, so taking this instance. +Merge (7 -> 4 leaves) took w.c.t. of 1.502e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) +3 iterations (4 th.) took 0.01116s; avg 0.00372s ( +/- 31.46/ 15.80 %); best 0.00255s; worst 0.004308s; std dev. 0.0008277 (taking best). +Reference operation time is 0.00254989 s (0.05647 Mflops) with 4 threads. +After merge step 3: tpop: 0.00255 s ~Mflops: 0.056 nsubm:4 otn:4 +Applying merge (7 -> 4 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.160x: 0.002199s -> 0.00255s. +Merge (4 -> 1 leaves) took w.c.t. of 1.407e-05s, ~5.96e-06s of computing time (of which 2.146e-06s sorting, 3.099e-06s analysis) +3 iterations (4 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 29.41/ 58.82 %); best 9.537e-07s; worst 2.146e-06s; std dev. 5.62e-07 (taking best). +Reference operation time is 9.53674e-07 s (151 Mflops) with 4 threads. +After merge step 4: tpop: 9.537e-07 s ~Mflops: 150.995 nsubm:1 otn:4 +Applying merge (4 -> 1 leaves, 4 th.) yielded SPEEDUP of 2305.750x: 0.002199s -> 9.537e-07s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 4 merge steps (of max 6) (16 -> 1 subms) took 0.06616s (of which 0.001475s partitioning, 0s I/O); computing times: 0.0001209s in par. loops, 5.96e-06s sorting, 2.027e-05s analyzing) +Total merge + benchmarking process took 0.06616s, equivalent to 69374.0/25.8 new/old ops (0.04436s for 4 clones -- as 46516.8/17.3 ops, or 11629.2/4.3 ops per clone), SPEEDUP of 2686.250x +Applying multi-merge (16 -> 1 leaves, 4 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2686.250x (0.002562s -> 9.537e-07s), will amortize in 25.8 ops by saving 0.002561s per op. +In 1 tuning rounds (tot. 0.088s, 0.044s for constructor, 4 clones) obtained a SPEEDUP of 268525.0% (2686x) (from 0.05621 to 151 Mflops). +After 0.087816s, global autotuning declared speedup of 2686.25 x, when using threads count of 4 and a new matrix: +(6 x 6)[0x227fdd0]{D} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' Considering S clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 7.168e-03 s (100.00 %) - analyzed arrays in 3.238e-03 s (45.17 %) - cleaned-up arrays in 1.907e-06 s (0.03 %) - deduplicated arrays in 9.537e-07 s (0.01 %) + converted COO to RSB in 2.488e-02 s (100.00 %) + analyzed arrays in 8.921e-03 s (35.86 %) + cleaned-up arrays in 1.907e-06 s (0.01 %) + deduplicated arrays in 9.537e-07 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.269e-03 s (31.65 %) - memory allocations took 1.121e-05 s (0.16 %) - leafs setup took 5.960e-06 s (0.08 %) - halfword conversion took 1.640e-03 s (22.88 %) -Built (6 x 6)[0x22ff2c0]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + shuffled partitions in 7.444e-03 s (29.92 %) + memory allocations took 3.147e-05 s (0.13 %) + leafs setup took 4.053e-06 s (0.02 %) + halfword conversion took 8.473e-03 s (34.06 %) +Built (6 x 6)[0x2283a20]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Base matrix: -(6 x 6)[0x22ff2c0]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(6 x 6)[0x2283a20]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (4 th.) took 0.003966s; avg 0.001322s ( +/- 8.09/ 7.71 %); best 0.001215s; worst 0.001424s; std dev. 8.534e-05 (taking best). -Reference operation time is 0.00121498 s (0.1185 Mflops) with 4 threads. -After 0.004008s, autotuning routine did not find a better threads count configuration. +3 iterations (4 th.) took 0.01025s; avg 0.003416s ( +/- 28.75/ 40.78 %); best 0.002434s; worst 0.004809s; std dev. 0.001012 (taking best). +Reference operation time is 0.00243402 s (0.05916 Mflops) with 4 threads. +After 0.010283s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (4 th.) took 0.00331s; avg 0.001103s ( +/- 46.91/ 55.18 %); best 0.0005858s; worst 0.001712s; std dev. 0.0004643 (taking best). -Reference operation time is 0.000585794 s (0.2458 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.0005858 Mflops: 0.246) -Merge (16 -> 10 leaves) took w.c.t. of 5.507e-05s, ~1.907e-05s of computing time (of which 1.907e-06s sorting, 7.153e-06s analysis) -3 iterations (4 th.) took 0.01754s; avg 0.005848s ( +/- 80.59/150.44 %); best 0.001135s; worst 0.01464s; std dev. 0.006226 (taking best). -Reference operation time is 0.00113511 s (0.1269 Mflops) with 4 threads. -After merge step 1: tpop: 0.001135 s ~Mflops: 0.127 nsubm:10 otn:4 -Applying merge (16 -> 10 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.938x: 0.0005858s -> 0.001135s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (16 -> 10 subms) took 0.01764s (of which 6.104e-05s partitioning, 0s I/O); computing times: 1.907e-05s in par. loops, 1.907e-06s sorting, 7.153e-06s analyzing) -Total merge + benchmarking process took 0.01764s, equivalent to 30.1/30.1 new/old ops (0.003246s for 1 clones -- as 5.5/5.5 ops, or 5.5/5.5 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (4 th.) took 0.004371s; avg 0.001457s ( +/- 24.37/ 39.33 %); best 0.001102s; worst 0.00203s; std dev. 0.0004091 (taking best). -Reference operation time is 0.00110197 s (0.1307 Mflops) with 4 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.001102 Mflops: 0.131) -Split (16 -> 28 leaves, 21 -> 37 subms) took 0.001629s (of which: 5.96e-06s analysis, -6.842e+09s mem.mgmt); compute time: 0.0002763s overall, 5.007e-06s searches, 0.0002713s shuffle, 8.726e-05s switch, 7.629e-06s quadrants. -3 iterations (4 th.) took 0.03531s; avg 0.01177s ( +/- 90.61/ 47.21 %); best 0.001105s; worst 0.01733s; std dev. 0.007544 (taking best). -Reference operation time is 0.00110507 s (0.1303 Mflops) with 4 threads. -After split step 1: tpop: 0.001105 s ~Mflops: 0.130 nsubm:28 otn:4 -Applying split (16 -> 28 leaves, 4 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99720x): 0.001102s -> 0.001105s, so IGNORING this instance. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001517s (of which: 1.001e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.004002s; avg 0.001334s ( +/- 13.64/ 16.35 %); best 0.001152s; worst 0.001552s; std dev. 0.0001653 (taking best). -Reference operation time is 0.00115204 s (0.125 Mflops) with 4 threads. -After split step 2: tpop: 0.001152 s ~Mflops: 0.125 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.045x: 0.001102s -> 0.001152s. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001132s (of which: 7.868e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.004028s; avg 0.001343s ( +/- 19.49/ 27.88 %); best 0.001081s; worst 0.001717s; std dev. 0.0002716 (taking best). -Reference operation time is 0.00108099 s (0.1332 Mflops) with 4 threads. -After split step 3: tpop: 0.001081 s ~Mflops: 0.133 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SPEEDUP of 1.019x: 0.001102s -> 0.001081s, so taking this instance. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001144s (of which: 7.868e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.002758s; avg 0.0009193s ( +/- 41.91/ 23.91 %); best 0.0005341s; worst 0.001139s; std dev. 0.0002733 (taking best). -Reference operation time is 0.000534058 s (0.2696 Mflops) with 4 threads. -After split step 4: tpop: 0.0005341 s ~Mflops: 0.270 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SPEEDUP of 2.024x: 0.001081s -> 0.0005341s, so taking this instance. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001158s (of which: 8.106e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.00556s; avg 0.001853s ( +/- 35.42/ 70.72 %); best 0.001197s; worst 0.003164s; std dev. 0.0009268 (taking best). -Reference operation time is 0.00119686 s (0.1203 Mflops) with 4 threads. -After split step 5: tpop: 0.001197 s ~Mflops: 0.120 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 2.241x: 0.0005341s -> 0.001197s. -Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 5 split steps (of max 6) (16 -> 28 subms) took 0.06601s (of which 0.007358s partitioning, 0s I/O); computing times: 0.0002763s in par. loops, 5.007e-06s sorting, 3.982e-05s analyzing) -Total split + benchmarking process took 0.06601s, equivalent to 123.6/59.9 new/old ops (0.01033s for 3 clones -- as 19.4/9.4 ops, or 6.5/3.1 ops per clone), SPEEDUP of 2.063x -Applying multi-split (16 -> 28 leaves, 4 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2.063x (0.001102s -> 0.0005341s), will amortize in 116.2 ops by saving 0.0005679s per op. -In 1 tuning rounds (tot. 0.098s, 0.014s for constructor, 4 clones) obtained a SPEEDUP of 106.3% (2.063x) (from 0.1307 to 0.2696 Mflops). -After 0.098221s, global autotuning declared speedup of 2.06339 x, when using threads count of 4 and a new matrix: -(6 x 6)[0x230ae30]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' +3 iterations (4 th.) took 0.0103s; avg 0.003434s ( +/- 29.48/ 22.85 %); best 0.002422s; worst 0.004219s; std dev. 0.0007512 (taking best). +Reference operation time is 0.00242186 s (0.05946 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.002422 Mflops: 0.059) +Merge (16 -> 10 leaves) took w.c.t. of 0.002472s, ~1.311e-05s of computing time (of which 2.861e-06s sorting, 5.007e-06s analysis) +3 iterations (4 th.) took 0.01125s; avg 0.00375s ( +/- 36.63/ 18.33 %); best 0.002376s; worst 0.004437s; std dev. 0.0009713 (taking best). +Reference operation time is 0.00237608 s (0.0606 Mflops) with 4 threads. +After merge step 1: tpop: 0.002376 s ~Mflops: 0.061 nsubm:10 otn:4 +Applying merge (16 -> 10 leaves, 4 th.) yielded SPEEDUP of 1.019x: 0.002422s -> 0.002376s, so taking this instance. +Merge (10 -> 7 leaves) took w.c.t. of 2.098e-05s, ~7.153e-06s of computing time (of which 1.192e-06s sorting, 5.007e-06s analysis) +3 iterations (4 th.) took 0.01151s; avg 0.003837s ( +/- 38.50/ 20.73 %); best 0.00236s; worst 0.004633s; std dev. 0.001046 (taking best). +Reference operation time is 0.00236011 s (0.06101 Mflops) with 4 threads. +After merge step 2: tpop: 0.00236 s ~Mflops: 0.061 nsubm:7 otn:4 +Applying merge (10 -> 7 leaves, 4 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00677x): 0.002376s -> 0.00236s, so IGNORING this instance. +Merge (7 -> 4 leaves) took w.c.t. of 1.407e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) +3 iterations (4 th.) took 0.009077s; avg 0.003026s ( +/- 26.60/ 50.87 %); best 0.002221s; worst 0.004565s; std dev. 0.001089 (taking best). +Reference operation time is 0.00222087 s (0.06484 Mflops) with 4 threads. +After merge step 3: tpop: 0.002221 s ~Mflops: 0.065 nsubm:4 otn:4 +Applying merge (7 -> 4 leaves, 4 th.) yielded SPEEDUP of 1.070x: 0.002376s -> 0.002221s, so taking this instance. +Merge (4 -> 1 leaves) took w.c.t. of 1.812e-05s, ~7.868e-06s of computing time (of which 9.537e-07s sorting, 4.053e-06s analysis) +3 iterations (4 th.) took 7.153e-06s; avg 2.384e-06s ( +/- 60.00/110.00 %); best 9.537e-07s; worst 5.007e-06s; std dev. 1.857e-06 (taking best). +Reference operation time is 9.53674e-07 s (151 Mflops) with 4 threads. +After merge step 4: tpop: 9.537e-07 s ~Mflops: 150.995 nsubm:1 otn:4 +Applying merge (4 -> 1 leaves, 4 th.) yielded SPEEDUP of 2328.750x: 0.002221s -> 9.537e-07s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 4 merge steps (of max 6) (16 -> 1 subms) took 0.06531s (of which 0.002549s partitioning, 0s I/O); computing times: 3.219e-05s in par. loops, 5.96e-06s sorting, 1.717e-05s analyzing) +Total merge + benchmarking process took 0.06531s, equivalent to 68484.5/27.0 new/old ops (0.04051s for 4 clones -- as 42478.0/16.7 ops, or 10619.5/4.2 ops per clone), SPEEDUP of 2539.500x +Applying multi-merge (16 -> 1 leaves, 4 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 2539.500x (0.002422s -> 9.537e-07s), will amortize in 27.0 ops by saving 0.002421s per op. +In 1 tuning rounds (tot. 0.086s, 0.041s for constructor, 4 clones) obtained a SPEEDUP of 253850.0% (2540x) (from 0.05946 to 151 Mflops). +After 0.085739s, global autotuning declared speedup of 2539.5 x, when using threads count of 4 and a new matrix: +(6 x 6)[0x2282370]{S} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' Considering C clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 6.967e-03 s (100.00 %) - analyzed arrays in 2.594e-03 s (37.23 %) - cleaned-up arrays in 2.146e-06 s (0.03 %) - deduplicated arrays in 1.907e-06 s (0.03 %) - sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.177e-03 s (31.25 %) - memory allocations took 8.821e-06 s (0.13 %) - leafs setup took 5.007e-06 s (0.07 %) - halfword conversion took 2.176e-03 s (31.23 %) -Built (6 x 6)[0x23017f0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + converted COO to RSB in 2.427e-02 s (100.00 %) + analyzed arrays in 1.005e-02 s (41.41 %) + cleaned-up arrays in 1.192e-06 s (0.00 %) + deduplicated arrays in 0.000e+00 s (0.00 %) + sorted arrays in 9.537e-07 s (0.00 %) + shuffled partitions in 7.268e-03 s (29.94 %) + memory allocations took 7.868e-06 s (0.03 %) + leafs setup took 2.861e-06 s (0.01 %) + halfword conversion took 6.939e-03 s (28.59 %) +Built (6 x 6)[0x2283a20]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Base matrix: -(6 x 6)[0x23017f0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(6 x 6)[0x2283a20]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (4 th.) took 0.1411s; avg 0.04702s ( +/- 98.77/195.08 %); best 0.0005801s; worst 0.1388s; std dev. 0.06486 (taking best). -Reference operation time is 0.000580072 s (0.993 Mflops) with 4 threads. -After 0.141126s, autotuning routine did not find a better threads count configuration. +3 iterations (4 th.) took 0.009969s; avg 0.003323s ( +/- 31.02/ 28.01 %); best 0.002292s; worst 0.004254s; std dev. 0.000804 (taking best). +Reference operation time is 0.00229216 s (0.2513 Mflops) with 4 threads. +After 0.010004s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (4 th.) took 0.00731s; avg 0.002437s ( +/- 71.85/103.02 %); best 0.0006859s; worst 0.004947s; std dev. 0.001821 (taking best). -Reference operation time is 0.00068593 s (0.8397 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.0006859 Mflops: 0.840) -Merge (16 -> 10 leaves) took w.c.t. of 4.005e-05s, ~2.217e-05s of computing time (of which 3.815e-06s sorting, 8.821e-06s analysis) -3 iterations (4 th.) took 0.004852s; avg 0.001617s ( +/- 33.16/ 64.54 %); best 0.001081s; worst 0.002661s; std dev. 0.0007381 (taking best). -Reference operation time is 0.00108099 s (0.5328 Mflops) with 4 threads. -After merge step 1: tpop: 0.001081 s ~Mflops: 0.533 nsubm:10 otn:4 -Applying merge (16 -> 10 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.576x: 0.0006859s -> 0.001081s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (16 -> 10 subms) took 0.005542s (of which 4.601e-05s partitioning, 0s I/O); computing times: 2.217e-05s in par. loops, 3.815e-06s sorting, 8.821e-06s analyzing) -Total merge + benchmarking process took 0.005542s, equivalent to 8.1/8.1 new/old ops (0.003628s for 1 clones -- as 5.3/5.3 ops, or 5.3/5.3 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (4 th.) took 0.009196s; avg 0.003065s ( +/- 62.91/125.07 %); best 0.001137s; worst 0.006899s; std dev. 0.002711 (taking best). -Reference operation time is 0.00113702 s (0.5066 Mflops) with 4 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.001137 Mflops: 0.507) -Split (16 -> 28 leaves, 21 -> 37 subms) took 0.001228s (of which: 8.106e-06s analysis, -6.842e+09s mem.mgmt); compute time: 4.983e-05s overall, 2.861e-06s searches, 4.697e-05s shuffle, 1.478e-05s switch, 3.815e-06s quadrants. -3 iterations (4 th.) took 0.003782s; avg 0.001261s ( +/- 15.52/ 25.73 %); best 0.001065s; worst 0.001585s; std dev. 0.000231 (taking best). -Reference operation time is 0.00106502 s (0.5408 Mflops) with 4 threads. -After split step 1: tpop: 0.001065 s ~Mflops: 0.541 nsubm:28 otn:4 -Applying split (16 -> 28 leaves, 4 th.) yielded SPEEDUP of 1.068x: 0.001137s -> 0.001065s, so taking this instance. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001712s (of which: 6.914e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.004178s; avg 0.001393s ( +/- 18.64/ 34.86 %); best 0.001133s; worst 0.001878s; std dev. 0.0003435 (taking best). -Reference operation time is 0.00113297 s (0.5084 Mflops) with 4 threads. -After split step 2: tpop: 0.001133 s ~Mflops: 0.508 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.064x: 0.001065s -> 0.001133s. -Split (28 -> 28 leaves, 37 -> 37 subms) took 0.001547s (of which: 8.821e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (4 th.) took 0.0093s; avg 0.0031s ( +/- 49.42/ 56.06 %); best 0.001568s; worst 0.004838s; std dev. 0.001343 (taking best). -Reference operation time is 0.00156808 s (0.3673 Mflops) with 4 threads. -After split step 3: tpop: 0.001568 s ~Mflops: 0.367 nsubm:28 otn:4 -Applying split (28 -> 28 leaves, 4 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.472x: 0.001065s -> 0.001568s. -Skipping further split based tests after 2 definite performance degradations in a row (and last exceeding limit). -A total of 3 split steps (of max 6) (16 -> 28 subms) took 0.02516s (of which 0.004583s partitioning, 0s I/O); computing times: 4.983e-05s in par. loops, 2.861e-06s sorting, 2.384e-05s analyzing) -Total split + benchmarking process took 0.02516s, equivalent to 23.6/22.1 new/old ops (0.006114s for 2 clones -- as 5.7/5.4 ops, or 2.9/2.7 ops per clone), SPEEDUP of 1.068x -Applying multi-split (16 -> 28 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1.068x (0.001137s -> 0.001065s), will amortize in 349.4 ops by saving 7.2e-05s per op. -In 1 tuning rounds (tot. 0.054s, 0.0097s for constructor, 3 clones) obtained a SPEEDUP of 6.8% (1.068x) (from 0.5066 to 0.5408 Mflops). -After 0.053889s, global autotuning declared speedup of 1.06761 x, when using threads count of 4 and a new matrix: -(6 x 6)[0x2303548]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' +3 iterations (4 th.) took 0.01041s; avg 0.003471s ( +/- 34.22/ 18.48 %); best 0.002283s; worst 0.004112s; std dev. 0.0008408 (taking best). +Reference operation time is 0.00228286 s (0.2523 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.002283 Mflops: 0.252) +Merge (16 -> 10 leaves) took w.c.t. of 0.00141s, ~1.407e-05s of computing time (of which 3.099e-06s sorting, 6.199e-06s analysis) +3 iterations (4 th.) took 0.01066s; avg 0.003553s ( +/- 32.06/ 21.72 %); best 0.002414s; worst 0.004325s; std dev. 0.0008223 (taking best). +Reference operation time is 0.00241399 s (0.2386 Mflops) with 4 threads. +After merge step 1: tpop: 0.002414 s ~Mflops: 0.239 nsubm:10 otn:4 +Applying merge (16 -> 10 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.057x: 0.002283s -> 0.002414s. +Merge (10 -> 7 leaves) took w.c.t. of 2.599e-05s, ~7.153e-06s of computing time (of which 1.192e-06s sorting, 8.106e-06s analysis) +3 iterations (4 th.) took 0.01159s; avg 0.003865s ( +/- 37.54/ 20.49 %); best 0.002414s; worst 0.004657s; std dev. 0.001027 (taking best). +Reference operation time is 0.00241399 s (0.2386 Mflops) with 4 threads. +After merge step 2: tpop: 0.002414 s ~Mflops: 0.239 nsubm:7 otn:4 +Applying merge (10 -> 7 leaves, 4 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.057x: 0.002283s -> 0.002414s. +Merge (7 -> 4 leaves) took w.c.t. of 1.812e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) +3 iterations (4 th.) took 0.01127s; avg 0.003757s ( +/- 38.73/ 41.29 %); best 0.002302s; worst 0.005309s; std dev. 0.001229 (taking best). +Reference operation time is 0.00230193 s (0.2502 Mflops) with 4 threads. +After merge step 3: tpop: 0.002302 s ~Mflops: 0.250 nsubm:4 otn:4 +Applying merge (7 -> 4 leaves, 4 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99171x): 0.002283s -> 0.002302s, so IGNORING this instance. +Merge (4 -> 1 leaves) took w.c.t. of 1.502e-05s, ~7.153e-06s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) +3 iterations (4 th.) took 7.153e-06s; avg 2.384e-06s ( +/- 50.00/ 70.00 %); best 1.192e-06s; worst 4.053e-06s; std dev. 1.216e-06 (taking best). +Reference operation time is 1.19209e-06 s (483.2 Mflops) with 4 threads. +After merge step 4: tpop: 1.192e-06 s ~Mflops: 483.184 nsubm:1 otn:4 +Applying merge (4 -> 1 leaves, 4 th.) yielded SPEEDUP of 1915.000x: 0.002283s -> 1.192e-06s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 4 merge steps (of max 6) (16 -> 1 subms) took 0.04503s (of which 0.001492s partitioning, 0s I/O); computing times: 3.338e-05s in par. loops, 7.153e-06s sorting, 2.241e-05s analyzing) +Total merge + benchmarking process took 0.04503s, equivalent to 37776.4/19.7 new/old ops (0.02122s for 2 clones -- as 17796.6/9.3 ops, or 8898.3/4.6 ops per clone), SPEEDUP of 1915.000x +Applying multi-merge (16 -> 1 leaves, 4 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1915.000x (0.002283s -> 1.192e-06s), will amortize in 19.7 ops by saving 0.002282s per op. +In 1 tuning rounds (tot. 0.067s, 0.021s for constructor, 2 clones) obtained a SPEEDUP of 191400.0% (1915x) (from 0.2523 to 483.2 Mflops). +After 0.067169s, global autotuning declared speedup of 1915 x, when using threads count of 4 and a new matrix: +(6 x 6)[0x2285790]{C} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' Considering Z clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 6.485e-03 s (100.00 %) - analyzed arrays in 2.278e-03 s (35.13 %) - cleaned-up arrays in 1.907e-06 s (0.03 %) - deduplicated arrays in 9.537e-07 s (0.01 %) + converted COO to RSB in 2.302e-02 s (100.00 %) + analyzed arrays in 9.493e-03 s (41.24 %) + cleaned-up arrays in 9.537e-07 s (0.00 %) + deduplicated arrays in 9.537e-07 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.134e-03 s (32.91 %) - memory allocations took 1.097e-05 s (0.17 %) - leafs setup took 5.007e-06 s (0.08 %) - halfword conversion took 2.053e-03 s (31.66 %) -Built (6 x 6)[0x2301080]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + shuffled partitions in 7.028e-03 s (30.53 %) + memory allocations took 9.060e-06 s (0.04 %) + leafs setup took 5.007e-06 s (0.02 %) + halfword conversion took 6.478e-03 s (28.14 %) +Built (6 x 6)[0x2283a20]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Base matrix: -(6 x 6)[0x2301080]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(6 x 6)[0x2283a20]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (4 th.) took 0.00363s; avg 0.00121s ( +/- 3.23/ 4.71 %); best 0.001171s; worst 0.001267s; std dev. 4.121e-05 (taking best). -Reference operation time is 0.00117087 s (0.4919 Mflops) with 4 threads. -After 0.003675s, autotuning routine did not find a better threads count configuration. +3 iterations (4 th.) took 0.01013s; avg 0.003376s ( +/- 31.88/ 17.82 %); best 0.0023s; worst 0.003978s; std dev. 0.0007628 (taking best). +Reference operation time is 0.00230002 s (0.2504 Mflops) with 4 threads. +After 0.010163s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (4 th.) took 0.03905s; avg 0.01302s ( +/- 87.06/173.57 %); best 0.001685s; worst 0.03561s; std dev. 0.01598 (taking best). -Reference operation time is 0.0016849 s (0.3419 Mflops) with 4 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.001685 Mflops: 0.342) -Merge (16 -> 10 leaves) took w.c.t. of 0.0001659s, ~2.098e-05s of computing time (of which 3.815e-06s sorting, 1.001e-05s analysis) -3 iterations (4 th.) took 0.005172s; avg 0.001724s ( +/- 24.88/ 48.32 %); best 0.001295s; worst 0.002557s; std dev. 0.0005891 (taking best). -Reference operation time is 0.00129509 s (0.4448 Mflops) with 4 threads. -After merge step 1: tpop: 0.001295 s ~Mflops: 0.445 nsubm:10 otn:4 -Applying merge (16 -> 10 leaves, 4 th.) yielded SPEEDUP of 1.301x: 0.001685s -> 0.001295s, so taking this instance. -Merge (10 -> 7 leaves) took w.c.t. of 2.408e-05s, ~8.106e-06s of computing time (of which 1.192e-06s sorting, 5.96e-06s analysis) -3 iterations (4 th.) took 0.01302s; avg 0.004341s ( +/- 30.25/ 59.86 %); best 0.003028s; worst 0.00694s; std dev. 0.001837 (taking best). -Reference operation time is 0.00302815 s (0.1902 Mflops) with 4 threads. -After merge step 2: tpop: 0.003028 s ~Mflops: 0.190 nsubm:7 otn:4 -Applying merge (10 -> 7 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 2.338x: 0.001295s -> 0.003028s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 merge steps (of max 6) (16 -> 7 subms) took 0.02207s (of which 0.000205s partitioning, 0s I/O); computing times: 2.909e-05s in par. loops, 5.007e-06s sorting, 1.597e-05s analyzing) -Total merge + benchmarking process took 0.02207s, equivalent to 17.0/13.1 new/old ops (0.007399s for 2 clones -- as 5.7/4.4 ops, or 2.9/2.2 ops per clone), SPEEDUP of 1.301x -Applying multi-merge (16 -> 10 leaves, 1 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1.301x (0.001685s -> 0.001295s), will amortize in 56.6 ops by saving 0.0003898s per op. -In 1 tuning rounds (tot. 0.065s, 0.0074s for constructor, 2 clones) obtained a SPEEDUP of 30.1% (1.301x) (from 0.3419 to 0.4448 Mflops). -After 0.065022s, global autotuning declared speedup of 1.30099 x, when using threads count of 4 and a new matrix: -(6 x 6)[0x2303ae0]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 10, symflags:'' +3 iterations (4 th.) took 0.009985s; avg 0.003328s ( +/- 28.13/ 43.25 %); best 0.002392s; worst 0.004768s; std dev. 0.001033 (taking best). +Reference operation time is 0.00239205 s (0.2408 Mflops) with 4 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.002392 Mflops: 0.241) +Merge (16 -> 10 leaves) took w.c.t. of 0.002072s, ~1.597e-05s of computing time (of which 3.815e-06s sorting, 6.914e-06s analysis) +3 iterations (4 th.) took 0.01073s; avg 0.003577s ( +/- 32.35/ 31.43 %); best 0.00242s; worst 0.004701s; std dev. 0.0009316 (taking best). +Reference operation time is 0.00241995 s (0.238 Mflops) with 4 threads. +After merge step 1: tpop: 0.00242 s ~Mflops: 0.238 nsubm:10 otn:4 +Applying merge (16 -> 10 leaves, 4 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.98847x): 0.002392s -> 0.00242s, so IGNORING this instance. +Merge (10 -> 7 leaves) took w.c.t. of 1.884e-05s, ~6.199e-06s of computing time (of which 1.907e-06s sorting, 5.96e-06s analysis) +3 iterations (4 th.) took 0.0116s; avg 0.003865s ( +/- 36.09/ 26.60 %); best 0.00247s; worst 0.004893s; std dev. 0.001023 (taking best). +Reference operation time is 0.00247002 s (0.2332 Mflops) with 4 threads. +After merge step 2: tpop: 0.00247 s ~Mflops: 0.233 nsubm:7 otn:4 +Applying merge (10 -> 7 leaves, 4 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.033x: 0.002392s -> 0.00247s. +Merge (7 -> 4 leaves) took w.c.t. of 1.597e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 4.053e-06s analysis) +3 iterations (4 th.) took 0.01142s; avg 0.003806s ( +/- 39.32/ 28.73 %); best 0.002309s; worst 0.004899s; std dev. 0.001095 (taking best). +Reference operation time is 0.00230908 s (0.2494 Mflops) with 4 threads. +After merge step 3: tpop: 0.002309 s ~Mflops: 0.249 nsubm:4 otn:4 +Applying merge (7 -> 4 leaves, 4 th.) yielded SPEEDUP of 1.036x: 0.002392s -> 0.002309s, so taking this instance. +Merge (4 -> 1 leaves) took w.c.t. of 1.693e-05s, ~7.153e-06s of computing time (of which 1.907e-06s sorting, 2.146e-06s analysis) +3 iterations (4 th.) took 8.821e-06s; avg 2.94e-06s ( +/- 35.14/ 70.27 %); best 1.907e-06s; worst 5.007e-06s; std dev. 1.461e-06 (taking best). +Reference operation time is 1.90735e-06 s (302 Mflops) with 4 threads. +After merge step 4: tpop: 1.907e-06 s ~Mflops: 301.990 nsubm:1 otn:4 +Applying merge (4 -> 1 leaves, 4 th.) yielded SPEEDUP of 1210.625x: 0.002309s -> 1.907e-06s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 4 merge steps (of max 6) (16 -> 1 subms) took 0.05698s (of which 0.002151s partitioning, 0s I/O); computing times: 3.338e-05s in par. loops, 8.583e-06s sorting, 1.907e-05s analyzing) +Total merge + benchmarking process took 0.05698s, equivalent to 29872.9/23.8 new/old ops (0.03236s for 3 clones -- as 16967.6/13.5 ops, or 5655.9/4.5 ops per clone), SPEEDUP of 1254.125x +Applying multi-merge (16 -> 1 leaves, 4 steps, 0 -> 4 th.sp.) yielded SPEEDUP of 1254.125x (0.002392s -> 1.907e-06s), will amortize in 23.8 ops by saving 0.00239s per op. +In 1 tuning rounds (tot. 0.078s, 0.032s for constructor, 3 clones) obtained a SPEEDUP of 125312.5% (1254x) (from 0.2408 to 302 Mflops). +After 0.078440s, global autotuning declared speedup of 1254.12 x, when using threads count of 4 and a new matrix: +(6 x 6)[0x227f2c0]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -10359,10 +10451,10 @@ 4 0 DIFF PRINT TEST END Beginning large binary search test. -Detected 2800267264 bytes of memory, comprehensive of 2352795648 of free memory. +Detected 2870853632 bytes of memory, comprehensive of 878264320 of free memory. On this system, maximal array of coordinates can have 2147483137 elements and occupy 4294965252 bytes. -Will perform the test using less memory (658 MB) than on the maximal coordinate indices array (690854912) allows. -(c)allocated 172713728 nnz (690854912 bytes) +Will perform the test using less memory (628 MB) than on the maximal coordinate indices array (658698240) allows. +(c)allocated 164674560 nnz (658698240 bytes) Succeeded retrieving array last element. Successfully performed large binary search test. BASIC SPARSE BLAS TEST: BEGIN @@ -10371,7 +10463,7 @@ got RSB_IO_WANT_IS_INITIALIZED_MARKER: 1 INIT INTERFACE TEST: END (SUCCESS) DEVEL PRINT TEST: BEGIN -(4 x 4)[0x2551590]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(4 x 4)[0x198e590]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -10380,8 +10472,8 @@ RSB_FLAG_ASSEMBLED_IN_COO_ARRAYS | RSB_FLAG_OWN_PARTITIONING_ARRAYS | RSB_FLAG_SORT_INPUT -(2 x 2)[0x2551660]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0x2551730]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0x198e660]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0x198e730]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' #R 4 x 4, 4 nnz (16 bytes), 16 index space for bytes, 416 bytes for 2 structs (2 of which are on the diagonal) (1e+02% of nnz are on the diagonal) #N at 0 0, 4 x 4, 4 nnz ( 25%) #T at 0 0, 2 x 2, 2 nnz ( 50%) @@ -10389,9 +10481,9 @@ ( 0x2046186 = { rec:1 coo:1 css:1 hw:1 ic:1 fi:0 symflags: } ) DEVEL PRINT TEST: END PRINT TEST: BEGIN [QUIET] -(2 x 2)[0x2551660]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0x2551730]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(4 x 4)[0x2551590]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(2 x 2)[0x198e660]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0x198e730]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(4 x 4)[0x198e590]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -10409,8 +10501,8 @@ BASIC PRIMITIVES TEST: BEGIN BASIC PRIMITIVES TEST: END (SUCCESS) ADVANCED SPARSE BLAS TEST: BEGIN [limit 30.000000s] [QUIET] -Terminating testing earlier due to user timeout request: test took 30.007475 s, max allowed was 30.000000. - PASSED:16137 +Terminating testing earlier due to user timeout request: test took 30.017954 s, max allowed was 30.000000. + PASSED:13081 FAILED:0 ADVANCED SPARSE BLAS TEST: END (SUCCESS) gmake qtests -C librsbpp @@ -10419,99 +10511,99 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' ./rsbtt -if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh +if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh ++ ./rsbpp Td,s G.mtx -++ grep Z-sort ++ wc -l +++ grep Z-sort + test 54 = 54 ++ ./rsbpp Td G.mtx -++ grep Z-sort ++ wc -l +++ grep Z-sort + test 27 = 27 ++ ./rsbpp Td,z G.mtx -++ grep Z-sort ++ wc -l +++ grep Z-sort + test 54 = 54 ++ ./rsbpp vTd,z G.mtx -++ grep Z-sort ++ wc -l +++ grep Z-sort + test 54 = 54 ++ ./rsbpp vTd,z G.mtx -++ grep Z-sort ++ wc -l +++ grep Z-sort + test 54 = 54 ++ ./rsbpp vvvTd,z G.mtx -++ grep Zorted ++ wc -l +++ grep Zorted + test 8 = 8 ++ ./rsbpp vvTd,z G.mtx -++ grep Z-sort ++ wc -l +++ grep Z-sort + test 54 = 54 ++ ./rsbpp vvTd,z G.mtx -++ grep Range ++ wc -l +++ grep Range + test 0 = 0 ++ ./rsbpp vvvTd,z G.mtx -++ grep Range ++ wc -l +++ grep Range + test 258 -gt 0 ++ ./rsbpp vvvTd,z S.mtx -++ grep Range ++ wc -l +++ grep Range + test 0 -eq 0 ++ ./rsbpp vvvTd,z G.mtx -++ grep Range ++ wc -l +++ grep Range + test 258 = 258 ++ OMP_NUM_THREADS=1 ++ ./rsbpp m10M10I1r1,4,8sFv -++ grep spmm- ++ wc -l +++ grep spmm- + test 9 = 9 ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r1,4,8sFv -++ grep spmm- ++ wc -l +++ grep spmm- + test 9 = 9 ++ OMP_NUM_THREADS=1 -++ grep spmm- ++ ./rsbpp C1000m100M100I1r1sFvtN,T ++ wc -l +++ grep spmm- + test 3 = 3 ++ OMP_NUM_THREADS=1 -++ grep spmm- ++ ./rsbpp C1000m100M100I1r1vtN,TsF ++ wc -l +++ grep spmm- + test 2 = 2 ++ OMP_NUM_THREADS=1 -++ grep spmm- ++ ./rsbpp C1000m100M100I1r0vtN,TsF ++ wc -l +++ grep spmm- + test 0 = 0 ++ OMP_NUM_THREADS=1 -++ grep Recursing ++ RSB_NUM_THREADS=1 ++ ./rsbpp vvvC1000m100M100I1r1vtN,TorsF ++ wc -l +++ grep Recursing + test 4 = 4 ++ OMP_NUM_THREADS=2 ++ RSB_NUM_THREADS=2 -++ grep Recursing ++ ./rsbpp vvvC1000m100M100I1r1vtN,TorsF ++ wc -l +++ grep Recursing + test 4 = 4 ++ OMP_NUM_THREADS=1 ++ RSB_NUM_THREADS=1 ++ ./rsbpp vvvC1000m100M100I1r1vtN,ToRsF -++ grep Recursing ++ wc -l +++ grep Recursing + test 208 = 208 ++ OMP_NUM_THREADS=2 -++ grep Recursing ++ RSB_NUM_THREADS=2 ++ ./rsbpp vvvC1000m100M100I1r1vtN,ToRsF ++ wc -l +++ grep Recursing + test 410 = 410 echo "Skipping tests based on Google Test (not detected at configure time)" Skipping tests based on Google Test (not detected at configure time) @@ -10558,7 +10650,7 @@ 0 0 0 0 before tuning for SPMV: -(3 x 3)[0x1ebda80]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' +(3 x 3)[0x4af840]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' ** x: 1.1 @@ -10647,18 +10739,18 @@ BEGIN Rsb_Matrix_test_multimatrix_ms_mnrhs BEGIN -(3 x 3)[0x1ed4cb0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x4d2160]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1: +(3 x 3)[0x4d2160]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x4cda80]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0x1ed4cb0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0x1edb230]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1.03274: -(3 x 3)[0x1ede6b0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0x1ed4cb0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1.71912: -(3 x 3)[0x1edee20]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0x1ed4cb0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x4cda80]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x4d2160]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0x1ed4cb0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x4d2160]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x4cda80]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1: +(3 x 3)[0x4cda80]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' END OK: terminating with no allocations registered in librsb [*] tests terminated successfully ! @@ -10675,10 +10767,10 @@ ./rsbtest --no-tune --max_t 0.01 --serial | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q Building ./rsbtest --no-tune --max_t 0.01 --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --no-trans --alpha 1 --type d --rand --serial . | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q adding ! ./rsbtest --mkl A.mkl -running on virt64c +running on i-capture-the-hostname Built without the MKL. ( ! ./rsbtest --unrecognized-option-triggers-abort ) -running on virt64c +running on i-capture-the-hostname /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest/.libs/rsbtest: unrecognized option '--unrecognized-option-triggers-abort' unrecognized option, aborting. ( ./rsbtest --no-tune --max_t 0.01 --skip-loading-hermitian-matrices --skip-loading-unsymmetric-matrices --tune-maxt 10 --tune-maxr 10 --verbose-tuning --extra-verbose-interface --min_t 0.01 --max_t 0.01 --mintimes 1 --maxtimes 1 --verbose --skip-loading-symmetric-matrices A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q skip ) @@ -10687,7 +10779,7 @@ ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --types all --nthreads 1,2 --maxtimes 1 -+ A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q 2.threads ) ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --render-only A.mtx > /dev/null ) ! ./rsbtest --no-tune --max_t 0.01 --quiet --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --render --no-trans --alpha 1 --type all A.mtx -running on virt64c +running on i-capture-the-hostname Will not invoke autotuning routine. Benchmark will sample for at most 0.01 s Built without render support! @@ -10739,7 +10831,7 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' /bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/arm-linux-gnueabihf' - /bin/bash ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/arm-linux-gnueabihf' + /bin/sh ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/arm-linux-gnueabihf' libtool: install: /usr/bin/install -c .libs/librsb.so.0.0.0 /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/arm-linux-gnueabihf/librsb.so.0.0.0 libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/arm-linux-gnueabihf && { ln -s -f librsb.so.0.0.0 librsb.so.0 || { rm -f librsb.so.0 && ln -s librsb.so.0.0.0 librsb.so.0; }; }) libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/arm-linux-gnueabihf && { ln -s -f librsb.so.0.0.0 librsb.so || { rm -f librsb.so && ln -s librsb.so.0.0.0 librsb.so; }; }) @@ -10749,7 +10841,7 @@ libtool: install: ranlib /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/arm-linux-gnueabihf/librsb.a libtool: warning: remember to run 'libtool --finish /usr/lib/arm-linux-gnueabihf' /bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' - /bin/bash ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' + /bin/sh ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' libtool: warning: 'librsb.la' has not been installed in '/usr/lib/arm-linux-gnueabihf' libtool: install: /usr/bin/install -c .libs/rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin/rsbench /bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' @@ -10878,9 +10970,9 @@ dh_gencontrol dh_md5sums dh_builddeb -dpkg-deb: building package 'librsb-tools-dbgsym' in '../librsb-tools-dbgsym_1.3.0.2+dfsg-4_armhf.deb'. -dpkg-deb: building package 'librsb-dev' in '../librsb-dev_1.3.0.2+dfsg-4_armhf.deb'. dpkg-deb: building package 'librsb0' in '../librsb0_1.3.0.2+dfsg-4_armhf.deb'. +dpkg-deb: building package 'librsb-dev' in '../librsb-dev_1.3.0.2+dfsg-4_armhf.deb'. +dpkg-deb: building package 'librsb-tools-dbgsym' in '../librsb-tools-dbgsym_1.3.0.2+dfsg-4_armhf.deb'. dpkg-deb: building package 'librsb-doc' in '../librsb-doc_1.3.0.2+dfsg-4_all.deb'. dpkg-deb: building package 'librsb-tools' in '../librsb-tools_1.3.0.2+dfsg-4_armhf.deb'. dpkg-deb: building package 'librsb0-dbgsym' in '../librsb0-dbgsym_1.3.0.2+dfsg-4_armhf.deb'. @@ -10892,12 +10984,14 @@ dpkg-buildpackage: info: binary-only upload (no source included) dpkg-genchanges: info: not including original source code in upload I: copying local configuration +I: user script /srv/workspace/pbuilder/10894/tmp/hooks/B01_cleanup starting +I: user script /srv/workspace/pbuilder/10894/tmp/hooks/B01_cleanup finished I: unmounting dev/ptmx filesystem I: unmounting dev/pts filesystem I: unmounting dev/shm filesystem I: unmounting proc filesystem I: unmounting sys filesystem I: cleaning the build env -I: removing directory /srv/workspace/pbuilder/21297 and its subdirectories -I: Current time: Sat Mar 16 08:04:22 -12 2024 -I: pbuilder-time-stamp: 1710619462 +I: removing directory /srv/workspace/pbuilder/10894 and its subdirectories +I: Current time: Sun Mar 17 11:02:28 +14 2024 +I: pbuilder-time-stamp: 1710622948