Diff of the two buildlogs: -- --- b1/build.log 2025-10-28 12:19:07.437033029 +0000 +++ b2/build.log 2025-10-28 12:30:42.777916626 +0000 @@ -1,6 +1,6 @@ I: pbuilder: network access will be disabled during build -I: Current time: Mon Nov 30 06:29:38 -12 2026 -I: pbuilder-time-stamp: 1796063378 +I: Current time: Wed Oct 29 02:19:09 +14 2025 +I: pbuilder-time-stamp: 1761653949 I: Building the build Environment I: extracting base tarball [/var/cache/pbuilder/unstable-reproducible-base.tgz] I: copying local configuration @@ -26,53 +26,85 @@ dpkg-source: info: applying auto-gitignore I: using fakeroot in build. I: Installing the build-deps -I: user script /srv/workspace/pbuilder/3017132/tmp/hooks/D02_print_environment starting +I: user script /srv/workspace/pbuilder/3598769/tmp/hooks/D01_modify_environment starting +debug: Running on codethink04-arm64. +I: Changing host+domainname to test build reproducibility +I: Adding a custom variable just for the fun of it... +I: Changing /bin/sh to bash +'/bin/sh' -> '/bin/bash' +lrwxrwxrwx 1 root root 9 Oct 28 12:19 /bin/sh -> /bin/bash +I: Setting pbuilder2's login shell to /bin/bash +I: Setting pbuilder2's GECOS to second user,second room,second work-phone,second home-phone,second other +I: user script /srv/workspace/pbuilder/3598769/tmp/hooks/D01_modify_environment finished +I: user script /srv/workspace/pbuilder/3598769/tmp/hooks/D02_print_environment starting I: set - BUILDDIR='/build/reproducible-path' - BUILDUSERGECOS='first user,first room,first work-phone,first home-phone,first other' - BUILDUSERNAME='pbuilder1' - BUILD_ARCH='arm64' - DEBIAN_FRONTEND='noninteractive' + BASH=/bin/sh + BASHOPTS=checkwinsize:cmdhist:complete_fullquote:extquote:force_fignore:globasciiranges:globskipdots:hostcomplete:interactive_comments:patsub_replacement:progcomp:promptvars:sourcepath + BASH_ALIASES=() + BASH_ARGC=() + BASH_ARGV=() + BASH_CMDS=() + BASH_LINENO=([0]="12" [1]="0") + BASH_LOADABLES_PATH=/usr/local/lib/bash:/usr/lib/bash:/opt/local/lib/bash:/usr/pkg/lib/bash:/opt/pkg/lib/bash:. + BASH_SOURCE=([0]="/tmp/hooks/D02_print_environment" [1]="/tmp/hooks/D02_print_environment") + BASH_VERSINFO=([0]="5" [1]="3" [2]="3" [3]="1" [4]="release" [5]="aarch64-unknown-linux-gnu") + BASH_VERSION='5.3.3(1)-release' + BUILDDIR=/build/reproducible-path + BUILDUSERGECOS='second user,second room,second work-phone,second home-phone,second other' + BUILDUSERNAME=pbuilder2 + BUILD_ARCH=arm64 + DEBIAN_FRONTEND=noninteractive DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=12 ' - DISTRIBUTION='unstable' - HOME='/root' - HOST_ARCH='arm64' + DIRSTACK=() + DISTRIBUTION=unstable + EUID=0 + FUNCNAME=([0]="Echo" [1]="main") + GROUPS=() + HOME=/root + HOSTNAME=i-capture-the-hostname + HOSTTYPE=aarch64 + HOST_ARCH=arm64 IFS=' ' - INVOCATION_ID='3e881ccda5c44779aea579f49f25163d' - LANG='C' - LANGUAGE='en_US:en' - LC_ALL='C' - MAIL='/var/mail/root' - OPTIND='1' - PATH='/usr/sbin:/usr/bin:/sbin:/bin:/usr/games' - PBCURRENTCOMMANDLINEOPERATION='build' - PBUILDER_OPERATION='build' - PBUILDER_PKGDATADIR='/usr/share/pbuilder' - PBUILDER_PKGLIBDIR='/usr/lib/pbuilder' - PBUILDER_SYSCONFDIR='/etc' - PPID='3017132' - PS1='# ' - PS2='> ' + INVOCATION_ID=fafd3e594c564a8cb5ba19660c7465ab + LANG=C + LANGUAGE=nl_BE:nl + LC_ALL=C + MACHTYPE=aarch64-unknown-linux-gnu + MAIL=/var/mail/root + OPTERR=1 + OPTIND=1 + OSTYPE=linux-gnu + PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path + PBCURRENTCOMMANDLINEOPERATION=build + PBUILDER_OPERATION=build + PBUILDER_PKGDATADIR=/usr/share/pbuilder + PBUILDER_PKGLIBDIR=/usr/lib/pbuilder + PBUILDER_SYSCONFDIR=/etc + PIPESTATUS=([0]="0") + POSIXLY_CORRECT=y + PPID=3598769 PS4='+ ' - PWD='/' - SHELL='/bin/bash' - SHLVL='2' - SUDO_COMMAND='/usr/bin/timeout -k 18.1h 18h /usr/bin/ionice -c 3 /usr/bin/nice /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.KfbwNK8Z/pbuilderrc_v5YK --distribution unstable --hookdir /etc/pbuilder/first-build-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/unstable-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.KfbwNK8Z/b1 --logfile b1/build.log librsb_1.3.0.2+dfsg-8.dsc' - SUDO_GID='109' - SUDO_HOME='/var/lib/jenkins' - SUDO_UID='104' - SUDO_USER='jenkins' - TERM='unknown' - TZ='/usr/share/zoneinfo/Etc/GMT+12' - USER='root' - _='/usr/bin/systemd-run' - http_proxy='http://192.168.101.4:3128' + PWD=/ + SHELL=/bin/bash + SHELLOPTS=braceexpand:errexit:hashall:interactive-comments:posix + SHLVL=3 + SUDO_COMMAND='/usr/bin/timeout -k 24.1h 24h /usr/bin/ionice -c 3 /usr/bin/nice -n 11 /usr/bin/unshare --uts -- /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.KfbwNK8Z/pbuilderrc_cgD2 --distribution unstable --hookdir /etc/pbuilder/rebuild-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/unstable-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.KfbwNK8Z/b2 --logfile b2/build.log librsb_1.3.0.2+dfsg-8.dsc' + SUDO_GID=109 + SUDO_HOME=/var/lib/jenkins + SUDO_UID=104 + SUDO_USER=jenkins + TERM=unknown + TZ=/usr/share/zoneinfo/Etc/GMT-14 + UID=0 + USER=root + _='I: set' + http_proxy=http://192.168.101.4:3128 I: uname -a - Linux codethink03-arm64 6.12.48+deb13-cloud-arm64 #1 SMP Debian 6.12.48-1 (2025-09-20) aarch64 GNU/Linux + Linux i-capture-the-hostname 6.12.48+deb13-cloud-arm64 #1 SMP Debian 6.12.48-1 (2025-09-20) aarch64 GNU/Linux I: ls -l /bin - lrwxrwxrwx 1 root root 7 Aug 10 2025 /bin -> usr/bin -I: user script /srv/workspace/pbuilder/3017132/tmp/hooks/D02_print_environment finished + lrwxrwxrwx 1 root root 7 Aug 10 12:30 /bin -> usr/bin +I: user script /srv/workspace/pbuilder/3598769/tmp/hooks/D02_print_environment finished -> Attempting to satisfy build-dependencies -> Creating pbuilder-satisfydepends-dummy package Package: pbuilder-satisfydepends-dummy @@ -297,7 +329,7 @@ Get: 177 http://deb.debian.org/debian unstable/main arm64 libltdl-dev arm64 2.5.4-7 [168 kB] Get: 178 http://deb.debian.org/debian unstable/main arm64 libhwloc-dev arm64 2.12.2-1 [239 kB] Get: 179 http://deb.debian.org/debian unstable/main arm64 zlib1g-dev arm64 1:1.3.dfsg+really1.3.1-1+b1 [917 kB] -Fetched 393 MB in 2s (216 MB/s) +Fetched 393 MB in 2s (223 MB/s) Preconfiguring packages ... Selecting previously unselected package libexpat1:arm64. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 19964 files and directories currently installed.) @@ -892,8 +924,8 @@ Setting up tzdata (2025b-5) ... Current default time zone: 'Etc/UTC' -Local time is now: Mon Nov 30 18:30:13 UTC 2026. -Universal Time is now: Mon Nov 30 18:30:13 UTC 2026. +Local time is now: Tue Oct 28 12:19:41 UTC 2025. +Universal Time is now: Tue Oct 28 12:19:41 UTC 2025. Run 'dpkg-reconfigure tzdata' if you wish to change it. Setting up libfontenc1:arm64 (1:1.1.8-1+b2) ... @@ -1065,7 +1097,11 @@ Solving dependencies... 0 upgraded, 0 newly installed, 0 to remove and 0 not upgraded. I: Building the package -I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-8_source.changes +I: user script /srv/workspace/pbuilder/3598769/tmp/hooks/A99_set_merged_usr starting +Not re-configuring usrmerge for unstable +I: user script /srv/workspace/pbuilder/3598769/tmp/hooks/A99_set_merged_usr finished +hostname: Name or service not known +I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-8_source.changes dpkg-buildpackage: info: source package librsb dpkg-buildpackage: info: source version 1.3.0.2+dfsg-8 dpkg-buildpackage: info: source distribution unstable @@ -1085,62 +1121,62 @@ dh binary dh_update_autotools_config dh_autoreconf -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found libtoolize: putting auxiliary files in '.'. libtoolize: copying file './ltmain.sh' libtoolize: putting macros in AC_CONFIG_MACRO_DIRS, 'm4'. @@ -1182,90 +1218,90 @@ libtoolize: copying file 'm4/ltsugar.m4' libtoolize: copying file 'm4/ltversion.m4' libtoolize: copying file 'm4/lt~obsolete.m4' -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found configure.ac:66: installing './compile' configure.ac:65: installing './missing' Makefile.am: installing './depcomp' @@ -1293,8 +1329,8 @@ checking whether make sets $(MAKE)... yes checking whether make supports nested variables... yes checking xargs -n works... yes -checking whether UID '1111' is supported by ustar format... yes -checking whether GID '1111' is supported by ustar format... yes +checking whether UID '2222' is supported by ustar format... yes +checking whether GID '2222' is supported by ustar format... yes checking how to create a ustar tar archive... gnutar checking build system type... aarch64-unknown-linux-gnu checking host system type... aarch64-unknown-linux-gnu @@ -1454,7 +1490,7 @@ checking for m4... m4 checking for gmake... gmake checking for ggrep... /usr/bin/grep -checking for bash... /bin/bash +checking for bash... /bin/sh checking for gsed... /usr/bin/sed checking for cmp... cmp checking for basename... basename @@ -1575,7 +1611,7 @@ configure: It appears that Fortran programs can be linked without using the Fortran linker. configure: Using OPENMP_CFLAGS ok for linking an OpenMP program: adding it to LIBS. checking if your have a usable getrusage() ... 1 -checking for /bin/bash... /bin/bash +checking for /bin/sh... /bin/sh configure: Will not use Google Test. configure: You seem to not have GNU Octave or have disabled 'int' type. Part of the test suite will not be generated. If you want more testing capabilities, you should enable the 'int' type as well. checking that generated files are newer than configure... done @@ -1597,7 +1633,7 @@ config.status: executing depfiles commands config.status: executing libtool commands === configuring in librsbpp (/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1608,8 +1644,8 @@ checking whether make sets $(MAKE)... yes checking whether make supports nested variables... yes checking xargs -n works... yes -checking whether UID '1111' is supported by ustar format... yes -checking whether GID '1111' is supported by ustar format... yes +checking whether UID '2222' is supported by ustar format... yes +checking whether GID '2222' is supported by ustar format... yes checking how to create a ustar tar archive... gnutar checking build system type... aarch64-unknown-linux-gnu checking host system type... aarch64-unknown-linux-gnu @@ -1725,7 +1761,7 @@ configure: Will not use Google Test. checking whether you have std::thread... yes checking whether you have std::mutex... yes -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1734,7 +1770,7 @@ config.status: executing libtool commands configure: Successfully created a Makefile. === configuring in rsblib (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1745,8 +1781,8 @@ checking whether make sets $(MAKE)... yes checking whether make supports nested variables... yes checking xargs -n works... yes -checking whether UID '1111' is supported by ustar format... yes -checking whether GID '1111' is supported by ustar format... yes +checking whether UID '2222' is supported by ustar format... yes +checking whether GID '2222' is supported by ustar format... yes checking how to create a ustar tar archive... gnutar checking build system type... aarch64-unknown-linux-gnu checking host system type... aarch64-unknown-linux-gnu @@ -1849,7 +1885,7 @@ checking for filesystem... yes checking for main in -lstdc++fs... yes configure: Assuming you are yet to build librsb.la. (set LIBS= -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la) -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1859,7 +1895,7 @@ config.status: executing libtool commands configure: Created a Makefile. === configuring in rsbtest (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1870,8 +1906,8 @@ checking whether make sets $(MAKE)... yes checking whether make supports nested variables... yes checking xargs -n works... yes -checking whether UID '1111' is supported by ustar format... yes -checking whether GID '1111' is supported by ustar format... yes +checking whether UID '2222' is supported by ustar format... yes +checking whether GID '2222' is supported by ustar format... yes checking how to create a ustar tar archive... gnutar checking build system type... aarch64-unknown-linux-gnu checking host system type... aarch64-unknown-linux-gnu @@ -1976,7 +2012,7 @@ checking for filesystem... yes checking for rsb_lib_init... no checking for dd... yes -/bin/bash +/bin/sh /usr/bin/timeout checking that generated files are newer than configure... done configure: creating ./config.status @@ -2008,7 +2044,7 @@ ARFLAGS : cru M4 : m4 MAKE : gmake - BASH : /bin/bash + BASH : /bin/sh OCTAVE : false DOXYGEN : doxygen HELP2MAN : help2man @@ -2087,19 +2123,19 @@ Making all in librsbpp gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp.o rsbpp.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbtt.o rsbtt.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -c -o rsbct.o rsbct.c libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -fPIC -DPIC -o .libs/rsbpp_csr.o libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -fPIC -DPIC -o .libs/rsbpp_coo.o In file included from rsbpp.hpp:44, - from rsbpp.cpp:28: + from rsbtt.cpp:21: /usr/include/c++/15/ccomplex:51:4: warning: #warning " is deprecated in C++17, use instead" [-Wcpp] 51 | # warning " is deprecated in C++17, use instead" | ^~~~~~~ In file included from rsbpp.hpp:44, - from rsbtt.cpp:21: + from rsbpp.cpp:28: /usr/include/c++/15/ccomplex:51:4: warning: #warning " is deprecated in C++17, use instead" [-Wcpp] 51 | # warning " is deprecated in C++17, use instead" | ^~~~~~~ @@ -2115,15 +2151,15 @@ | ^~~~~~~ libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -o rsbpp_coo.o >/dev/null 2>&1 libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -o rsbpp_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs libtool: link: ar cr .libs/librsbpp.a .libs/rsbpp_coo.o .libs/rsbpp_csr.o libtool: link: ranlib .libs/librsbpp.a libtool: link: ( cd ".libs" && rm -f "librsbpp.la" && ln -s "../librsbpp.la" "librsbpp.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs -libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbct rsbct.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbtt rsbtt.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp +libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbct rsbct.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbpp rsbpp.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp gmake all-am gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' @@ -2142,109 +2178,88 @@ gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsbench-rsb_libspblas_tests.o `test -f 'rsb_libspblas_tests.c' || echo './'`rsb_libspblas_tests.c g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -c -o rsb_dummy.o rsb_dummy.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o ch2icfb-ch2icfb.o `test -f 'ch2icfb.c' || echo './'`ch2icfb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_stropts.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_stropts.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_vb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_vb.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_stropts.c -o librsb_nounroll_la-rsb_stropts.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_lb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_lb.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -o librsb_nounroll_la-rsb_unroll.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_vb.c -o librsb_nounroll_la-rsb_krnl_vb.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_lb.c -o librsb_nounroll_la-rsb_krnl_lb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_vb.c -o librsb_nounroll_la-rsb_krnl_vb.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mergesort.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_mergesort.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -o librsb_nounroll_la-rsb_strmif.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_permute.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_permute.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_l.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -o librsb_nounroll_la-rsb_strmif.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mergesort.c -o librsb_nounroll_la-rsb_mergesort.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_l.c -o librsb_nounroll_la-rsb_krnl_bcss_l.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_u.c -o librsb_nounroll_la-rsb_krnl_bcss_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_l.c -o librsb_nounroll_la-rsb_krnl_bcss_l.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss.c -o librsb_nounroll_la-rsb_krnl_bcss.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -o librsb_nounroll_la-rsb_bench.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spmv.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spmv.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss.c -o librsb_nounroll_la-rsb_krnl_bcss.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_merge.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_merge.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_merge.c -o librsb_nounroll_la-rsb_merge.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_permute.c -o librsb_nounroll_la-rsb_permute.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -o librsb_nounroll_la-rsb_bench.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spmv.c -o librsb_nounroll_la-rsb_spmv.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_merge.c -o librsb_nounroll_la-rsb_merge.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_ompio.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_ompio.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_util.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_ompio.c -o librsb_nounroll_la-rsb_ompio.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_util.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm_csr.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spgemm_csr.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spsum_misc.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm_csr.c -o librsb_nounroll_la-rsb_spgemm_csr.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_prec.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_prec.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_is.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_is.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm_csr.c -o librsb_nounroll_la-rsb_spgemm_csr.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_is.c -o librsb_base_la-rsb_is.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_prec.c -o librsb_nounroll_la-rsb_prec.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -o librsb_nounroll_la-rsb_spsum_misc.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_prec.c -o librsb_nounroll_la-rsb_prec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mio.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_is.c -o librsb_base_la-rsb_is.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_op.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_op.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_bio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_op.c -o librsb_base_la-rsb_op.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_bio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_get.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_set.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_set.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bio.c -o librsb_base_la-rsb_bio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mio.c -o librsb_base_la-rsb_mio.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_set.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_set.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_set.c -o librsb_base_la-rsb_set.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -o librsb_base_la-rsb_coo.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_check.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_check.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -o librsb_base_la-rsb_get.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_check.c -o librsb_base_la-rsb_coo_check.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_symm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_symm.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_idx.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_symm.c -o librsb_base_la-rsb_coo_symm.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srt.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srtp.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -o librsb_base_la-rsb_srt.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -o librsb_base_la-rsb_srtp.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_src.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_src.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo.o rsb_test_matops.c: In function 'rsb__main_block_partitioned_spmv_sxsa': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2263,136 +2278,154 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -o librsb_base_la-rsb_idx.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -o librsb_base_la-rsb_coo.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -o librsb_base_la-rsb_get.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_check.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_check.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_symm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_symm.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_check.c -o librsb_base_la-rsb_coo_check.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_idx.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_symm.c -o librsb_base_la-rsb_coo_symm.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srt.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srtp.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_src.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_src.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -o librsb_base_la-rsb_srtp.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_src.c -o librsb_base_la-rsb_src.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_test_accuracy.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -o librsb_base_la-rsb_idx.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -o librsb_base_la-rsb_srt.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_clone.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_test_accuracy.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -o librsb_base_la-rsb_test_accuracy.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_render.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_render.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -o librsb_base_la-rsb_clone.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_render.c -o librsb_base_la-rsb_render.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_eps.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_eps.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -o librsb_base_la-rsb_clone.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_msort_up.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_msort_up.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_sys.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -o librsb_base_la-rsb_rec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_msort_up.c -o librsb_base_la-rsb_msort_up.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_eps.c -o librsb_base_la-rsb_eps.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_sys.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -o librsb_base_la-rsb_sys.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_eps.c -o librsb_base_la-rsb_eps.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_blas_stuff.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -o librsb_base_la-rsb_blas_stuff.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_gen.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_gen.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -o librsb_base_la-rsb_blas_stuff.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_perf.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rsb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rsb.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_err.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_err.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -o librsb_base_la-rsb_perf.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rsb.c -o librsb_base_la-rsb_rsb.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_gen.c -o librsb_base_la-rsb_gen.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -o librsb_base_la-rsb_perf.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_err.c -o librsb_base_la-rsb_err.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rsb.c -o librsb_base_la-rsb_rsb.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_tune.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_do.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_internals.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_internals.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_garbage.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_garbage.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -o librsb_base_la-rsb_do.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_garbage.c -o librsb_base_la-rsb_garbage.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mmio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mmio.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_partition.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_garbage.c -o librsb_base_la-rsb_garbage.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -o librsb_base_la-rsb_do.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mmio.c -o librsb_base_la-rsb_mmio.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -o librsb_base_la-rsb_partition.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mbw.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_partition.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_internals.c -o librsb_base_la-rsb_internals.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mbw.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_limiter.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -o librsb_base_la-rsb_limiter.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -o librsb_base_la-rsb_partition.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_fpb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_fpb.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -o librsb_base_la-rsb_limiter.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_fpb.c -o librsb_base_la-rsb_fpb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spgemm.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsum.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum.c -o librsb_base_la-rsb_spsum.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsv.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_lock.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm.c -o librsb_base_la-rsb_spgemm.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum.c -o librsb_base_la-rsb_spsum.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -o librsb_base_la-rsb_lock.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_lock.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_swt.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_init.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -o librsb_base_la-rsb_lock.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsv.c -o librsb_base_la-rsb_spsv.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_dump.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_cpmv.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -o librsb_base_la-rsb_swt.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_dump.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_cpmv.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -o librsb_base_la-rsb_init.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -o librsb_base_la-rsb_cpmv.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_asm.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_user.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo2rec.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2coo.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2csr.o -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -o librsb_base_la-rsb_user.o >/dev/null 2>&1 -libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -fPIC -o .libs/rsb_blas_sparse.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -o librsb_base_la-rsb_rec2csr.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -o librsb_base_la-rsb_rec2coo.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -o librsb_base_la-rsb_csr2coo.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -fPIC -DPIC -o .libs/rsb_libspblas_handle.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -o librsb_base_la-rsb_rec2csr.o >/dev/null 2>&1 +libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -fPIC -o .libs/rsb_blas_sparse.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -fPIC -DPIC -o .libs/rsb_libspblas.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -fPIC -DPIC -o .libs/rsb_libspblas_handle.o gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.o rsb_blas_sparse.F90 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -o librsb_base_la-rsb_csr2coo.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm libtool: warning: '-version-info' is ignored for programs libtool: link: gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -Wl,-z -Wl,relro -o ch2icfb ch2icfb-ch2icfb.o -fopenmp -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 if test -f ./rsb_types.h -a ! -f ./rsb_types.h ; then cp -pv ./rsb_types.h ./rsb_types.h ; fi # out-of-dir behaviour varies between installations -if test -f ch2icfb ; then if SED=/usr/bin/sed GREP=/usr/bin/grep /bin/bash ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.lo rsb.F90 +if test -f ch2icfb ; then if SED=/usr/bin/sed GREP=/usr/bin/grep /bin/sh ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.lo rsb.F90 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb.F90 -fPIC -o .libs/rsb.o libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb.F90 -o rsb.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -o rsb_libspblas_handle.o >/dev/null 2>&1 gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.o rsb.F90 -libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -o rsb_blas_sparse.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -o rsb_libspblas.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -o librsb_nounroll_la-rsb_krnl.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -o rsb_libspblas_handle.o >/dev/null 2>&1 rsb_test_matops.c: In function 'rsb__main_block_partitioned_spsv_sxsx': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2407,16 +2440,19 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -o rsb_blas_sparse.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -o rsb_libspblas.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -o librsb_nounroll_la-rsb_krnl.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm libtool: warning: '-version-info/-version-number' is ignored for convenience libraries +libtool: link: ar cr .libs/librsb_base.a .libs/librsb_base_la-rsb_is.o .libs/librsb_base_la-rsb_mio.o .libs/librsb_base_la-rsb_op.o .libs/librsb_base_la-rsb_bio.o .libs/librsb_base_la-rsb_get.o .libs/librsb_base_la-rsb_set.o .libs/librsb_base_la-rsb_coo.o .libs/librsb_base_la-rsb_csr.o .libs/librsb_base_la-rsb_coo_check.o .libs/librsb_base_la-rsb_coo_symm.o .libs/librsb_base_la-rsb_idx.o .libs/librsb_base_la-rsb_srt.o .libs/librsb_base_la-rsb_srtp.o .libs/librsb_base_la-rsb_src.o .libs/librsb_base_la-rsb_test_accuracy.o .libs/librsb_base_la-rsb_clone.o .libs/librsb_base_la-rsb_rec.o .libs/librsb_base_la-rsb_render.o .libs/librsb_base_la-rsb_eps.o .libs/librsb_base_la-rsb_msort_up.o .libs/librsb_base_la-rsb_sys.o .libs/librsb_base_la-rsb_blas_stuff.o .libs/librsb_base_la-rsb_gen.o .libs/librsb_base_la-rsb_perf.o .libs/librsb_base_la-rsb_rsb.o .libs/librsb_base_la-rsb_err.o .libs/librsb_base_la-rsb_tune.o .libs/librsb_base_la-rsb_do.o .libs/librsb_base_la-rsb_internals.o .libs/librsb_base_la-rsb_garbage.o .libs/librsb_base_la-rsb_mmio.o .libs/librsb_base_la-rsb_partition.o .libs/librsb_base_la-rsb_mbw.o .libs/librsb_base_la-rsb_limiter.o .libs/librsb_base_la-rsb_fpb.o .libs/librsb_base_la-rsb_spgemm.o .libs/librsb_base_la-rsb_spsum.o .libs/librsb_base_la-rsb_spsv.o .libs/librsb_base_la-rsb_lock.o .libs/librsb_base_la-rsb_swt.o .libs/librsb_base_la-rsb_init.o .libs/librsb_base_la-rsb_dump.o .libs/librsb_base_la-rsb_cpmv.o .libs/librsb_base_la-rsb_asm.o .libs/librsb_base_la-rsb_user.o .libs/librsb_base_la-rsb_coo2rec.o .libs/librsb_base_la-rsb_rec2coo.o .libs/librsb_base_la-rsb_rec2csr.o .libs/librsb_base_la-rsb_csr2coo.o .libs/rsb_blas_sparse.o +libtool: link: ranlib .libs/librsb_base.a +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +libtool: link: ( cd ".libs" && rm -f "librsb_base.la" && ln -s "../librsb_base.la" "librsb_base.la" ) libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_spblas.a .libs/rsb_libspblas_handle.o .libs/rsb_libspblas.o libtool: link: ranlib .libs/librsb_spblas.a libtool: link: ( cd ".libs" && rm -f "librsb_spblas.la" && ln -s "../librsb_spblas.la" "librsb_spblas.la" ) -libtool: link: ar cr .libs/librsb_base.a .libs/librsb_base_la-rsb_is.o .libs/librsb_base_la-rsb_mio.o .libs/librsb_base_la-rsb_op.o .libs/librsb_base_la-rsb_bio.o .libs/librsb_base_la-rsb_get.o .libs/librsb_base_la-rsb_set.o .libs/librsb_base_la-rsb_coo.o .libs/librsb_base_la-rsb_csr.o .libs/librsb_base_la-rsb_coo_check.o .libs/librsb_base_la-rsb_coo_symm.o .libs/librsb_base_la-rsb_idx.o .libs/librsb_base_la-rsb_srt.o .libs/librsb_base_la-rsb_srtp.o .libs/librsb_base_la-rsb_src.o .libs/librsb_base_la-rsb_test_accuracy.o .libs/librsb_base_la-rsb_clone.o .libs/librsb_base_la-rsb_rec.o .libs/librsb_base_la-rsb_render.o .libs/librsb_base_la-rsb_eps.o .libs/librsb_base_la-rsb_msort_up.o .libs/librsb_base_la-rsb_sys.o .libs/librsb_base_la-rsb_blas_stuff.o .libs/librsb_base_la-rsb_gen.o .libs/librsb_base_la-rsb_perf.o .libs/librsb_base_la-rsb_rsb.o .libs/librsb_base_la-rsb_err.o .libs/librsb_base_la-rsb_tune.o .libs/librsb_base_la-rsb_do.o .libs/librsb_base_la-rsb_internals.o .libs/librsb_base_la-rsb_garbage.o .libs/librsb_base_la-rsb_mmio.o .libs/librsb_base_la-rsb_partition.o .libs/librsb_base_la-rsb_mbw.o .libs/librsb_base_la-rsb_limiter.o .libs/librsb_base_la-rsb_fpb.o .libs/librsb_base_la-rsb_spgemm.o .libs/librsb_base_la-rsb_spsum.o .libs/librsb_base_la-rsb_spsv.o .libs/librsb_base_la-rsb_lock.o .libs/librsb_base_la-rsb_swt.o .libs/librsb_base_la-rsb_init.o .libs/librsb_base_la-rsb_dump.o .libs/librsb_base_la-rsb_cpmv.o .libs/librsb_base_la-rsb_asm.o .libs/librsb_base_la-rsb_user.o .libs/librsb_base_la-rsb_coo2rec.o .libs/librsb_base_la-rsb_rec2coo.o .libs/librsb_base_la-rsb_rec2csr.o .libs/librsb_base_la-rsb_csr2coo.o .libs/rsb_blas_sparse.o -libtool: link: ranlib .libs/librsb_base.a -libtool: link: ( cd ".libs" && rm -f "librsb_base.la" && ln -s "../librsb_base.la" "librsb_base.la" ) rsb_test_matops.c: In function 'rsb__main_block_partitioned_mat_stats': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2433,12 +2469,12 @@ | ~~~~~~~~~~~~~~~~~ libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_nounroll.a .libs/librsb_nounroll_la-rsb_stropts.o .libs/librsb_nounroll_la-rsb_strmif.o .libs/librsb_nounroll_la-rsb_unroll.o .libs/librsb_nounroll_la-rsb_krnl_vb.o .libs/librsb_nounroll_la-rsb_krnl_lb.o .libs/librsb_nounroll_la-rsb_krnl.o .libs/librsb_nounroll_la-rsb_bench.o .libs/librsb_nounroll_la-rsb_mergesort.o .libs/librsb_nounroll_la-rsb_permute.o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss.o .libs/librsb_nounroll_la-rsb_spmv.o .libs/librsb_nounroll_la-rsb_merge.o .libs/librsb_nounroll_la-rsb_ompio.o .libs/librsb_nounroll_la-rsb_util.o .libs/librsb_nounroll_la-rsb_spgemm_csr.o .libs/librsb_nounroll_la-rsb_spsum_misc.o .libs/librsb_nounroll_la-rsb_prec.o libtool: link: ranlib .libs/librsb_nounroll.a libtool: link: ( cd ".libs" && rm -f "librsb_nounroll.la" && ln -s "../librsb_nounroll.la" "librsb_nounroll.la" ) -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/aarch64-linux-gnu rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/aarch64-linux-gnu rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm libtool: link: gcc -shared -fPIC -DPIC .libs/rsb.o -Wl,--whole-archive ./.libs/librsb_nounroll.a ./.libs/librsb_base.a ./.libs/librsb_spblas.a /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/.libs/librsbpp.a -Wl,--no-whole-archive -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lpthread -lstdc++fs -lstdc++ -lhwloc -lz -lgfortran -lm -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Werror=format-security -mbranch-protection=standard -O3 -Wl,-z -Wl,relro -fopenmp -fopenmp -Wl,-soname -Wl,librsb.so.0 -o .libs/librsb.so.0.0.0 /usr/lib/gcc/aarch64-linux-gnu/15/libstdc++.so: warning: GCS is required by -z gcs, but this shared library lacks the necessary property note. The dynamic loader might not enable GCS or refuse to load the program unless all the shared library dependencies have the GCS marking. /usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu/libhwloc.so: warning: GCS is required by -z gcs, but this shared library lacks the necessary property note. The dynamic loader might not enable GCS or refuse to load the program unless all the shared library dependencies have the GCS marking. @@ -2459,7 +2495,7 @@ libtool: link: ranlib .libs/librsb.a libtool: link: rm -fr .libs/librsb.lax libtool: link: ( cd ".libs" && rm -f "librsb.la" && ln -s "../librsb.la" "librsb.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm libtool: warning: '-version-info' is ignored for programs libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o -fopenmp ./.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -2476,27 +2512,27 @@ gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o fortran.o fortran.F90 gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o fortran_rsb_fi.o fortran_rsb_fi.F90 g++ -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -c -o cplusplus.o cplusplus.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/backsolve backsolve.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/io-spblas io-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/hello hello.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/hello-spblas hello-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/power power.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/backsolve backsolve.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/hello hello.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran_rsb_fi fortran_rsb_fi.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran fortran.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/autotune autotune.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran fortran.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/snippets snippets.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/cplusplus cplusplus.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/15 -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/15/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/15/../../.. -L/lib -L/usr/lib -lgfortran -lm -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' Making all in scripts @@ -2516,9 +2552,9 @@ /usr/bin/mkdir -p man /usr/bin/mkdir -p man gmake makedox -SOURCE_DATE_EPOCH=1767272461 \ +SOURCE_DATE_EPOCH=1735642861 \ help2man --name="benchmark and test for librsb" --no-info ../rsbench | /usr/bin/sed 's/January //g' > man/rsbench.1 -SOURCE_DATE_EPOCH=1767272461 \ +SOURCE_DATE_EPOCH=1735642861 \ help2man --name="provide configuration information for librsb" --no-info /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb-config | /usr/bin/sed 's/January //g' > man/librsb-config.1 gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/doc' DOXYGEN_PROJECT_NUMBER=1.3.0.2 doxygen Doxyfile || echo "are you sure you have doxygen installed ?" @@ -3230,13 +3266,13 @@ g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt_ne-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt_rv-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' Making all in examples @@ -3251,25 +3287,25 @@ g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o mtx2bin.o mtx2bin.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o render.o render.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o span.o span.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib/examples' gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' @@ -3279,7 +3315,7 @@ gmake all-am gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' g++ -DHAVE_CONFIG_H -I. -I/build/reproducible-path/librsb-1.3.0.2+dfsg -Wdate-time -D_FORTIFY_SOURCE=2 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rsbtest.o rsbtest.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lstdc++fs -fopenmp gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' @@ -3355,7 +3391,7 @@ gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake mtests -C . gmake[3]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash -ex ./scripts/readme-tests.sh +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh -ex ./scripts/readme-tests.sh + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x + ./rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # --bench option implies -qH -R --write-performance-record --want-mkl-autotune --mkl-benchmark --types : --split-experimental 6 --merge-experimental 6 --also-transpose --sort-filenames-list --want-memory-benchmark @@ -3365,15 +3401,15 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1796064017 +# beginning run at 1761654533 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -# average timer granularity: 7.74e-08 s -# Will write a final performance record to file rsbench_pr__1796064017_gcc-15.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1796064017_gcc-15.2-1,4th.rpr.tmp +# average timer granularity: 2.87e-08 s +# Will write a final performance record to file rsbench_pr__1761654533_gcc-15.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1761654533_gcc-15.2-1,4th.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -3412,61 +3448,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 5.382s +# Memory benchmark took 5.344s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 8 samples (2240 bytes). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.386s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.345s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type Z... -# file input of A.mtx took 0.00 s (6 nnz, 28150 nnz/s ) (0.86 MB/s ) -#pre-sorting (6 elements) took 0.00174379 s -#weeding duplicates (to 6 elements) took 1.90735e-06 s (and check, 1.90735e-06 s ) +# file input of A.mtx took 0.00 s (6 nnz, 36792 nnz/s ) (1.13 MB/s ) +#pre-sorting (6 elements) took 0.00146914 s +#weeding duplicates (to 6 elements) took 1.90735e-06 s (and check, 2.14577e-06 s ) # multi-nrhs benchmarking (1,2) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.007s): (3 x 3)[0xaaaafa567840]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.007s): (3 x 3)[0xaaaaf8a73880]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 0.003707s; avg 0.001236s ( +/- 1.11/ 1.97 %); best 0.001222s; worst 0.00126s; std dev. 1.73e-05 (taking best). -Reference operation time is 0.0012219 s (0.07857 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001222 Mflops: 0.079) -Merge (3 -> 1 leaves) took w.c.t. of 1.907e-05s, ~7.153e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (1 th.) took 0.0002651s; avg 8.837e-05s ( +/- 99.91/200.00 %); best 8.19e-08s; worst 0.0002651s; std dev. 0.000125 (taking best). -Reference operation time is 8.18968e-08 s (1172 Mflops) with 1 threads. -After merge step 1: tpop: 8.19e-08 s ~Mflops: 1172.207 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 14919.942x: 0.001222s -> 8.19e-08s, so taking this instance. +3 iterations (1 th.) took 0.003663s; avg 0.001221s ( +/- 0.59/ 0.84 %); best 0.001214s; worst 0.001231s; std dev. 7.436e-06 (taking best). +Reference operation time is 0.00121379 s (0.07909 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001214 Mflops: 0.079) +Merge (3 -> 1 leaves) took w.c.t. of 2.098e-05s, ~7.868e-06s of computing time (of which 9.537e-07s sorting, 2.861e-06s analysis) +3 iterations (1 th.) took 0.000284s; avg 9.465e-05s ( +/- 98.99/197.98 %); best 9.537e-07s; worst 0.000282s; std dev. 0.0001325 (taking best). +Reference operation time is 9.53674e-07 s (100.7 Mflops) with 1 threads. +After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1272.750x: 0.001214s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00369s (of which 2.193e-05s partitioning, 0s I/O); computing times: 7.153e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.00369s, equivalent to 45056.8/3.0 new/old ops (0.006848s for 2 clones -- as 83615.7/5.6 ops, or 41807.9/2.8 ops per clone), SPEEDUP of 14919.942x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 14919.942x (0.001222s -> 8.19e-08s), will amortize in 3.0 ops by saving 0.001222s per op. -In 1 tuning rounds (tot. 0.011s, 0.0068s for constructor, 2 clones) obtained a SPEEDUP of 1491894.2% (1.492e+04x) (from 0.07857 to 1172 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003661s (of which 2.718e-05s partitioning, 0s I/O); computing times: 7.868e-06s in par. loops, 9.537e-07s sorting, 2.861e-06s analyzing) +Total merge + benchmarking process took 0.003661s, equivalent to 3839.0/3.0 new/old ops (0.006801s for 2 clones -- as 7131.2/5.6 ops, or 3565.6/2.8 ops per clone), SPEEDUP of 1272.750x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 1272.750x (0.001214s -> 9.537e-07s), will amortize in 3.0 ops by saving 0.001213s per op. +In 1 tuning rounds (tot. 0.011s, 0.0068s for constructor, 2 clones) obtained a SPEEDUP of 127175.0% (1273x) (from 0.07909 to 100.7 Mflops). #pr: updating sample at index 1 (0^th of 8), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.0109909 s (1.222e-03 s -> 8.190e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.010958 s (1.214e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.053165 s and estimated a speedup of 1.000000 x (8.190e-08 s -> 8.190e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.061599 s and estimated a speedup of 1.000000 x (3.000e-08 s -> 3.000e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.001611 0.002554 0.004165 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.004165 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.001611 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.002554 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.002430 0.002509 0.004939 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.004939 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.002430 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.002509 %:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.004165 +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.004939 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 @@ -3481,47 +3517,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.008s): (3 x 3)[0xaaaafa567840]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.006s): (3 x 3)[0xaaaaf8a73880]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.003705s; avg 0.001235s ( +/- 17.41/ 10.44 %); best 0.00102s; worst 0.001364s; std dev. 0.0001531 (taking best). -Reference operation time is 0.00101995 s (0.09412 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.00102 Mflops: 0.094) -Merge (3 -> 1 leaves) took w.c.t. of 1.407e-05s, ~5.96e-06s of computing time (of which 1.907e-06s sorting, 2.146e-06s analysis) -3 iterations (4 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 95.09/128.57 %); best 8.19e-08s; worst 3.815e-06s; std dev. 1.593e-06 (taking best). -Reference operation time is 8.18968e-08 s (1172 Mflops) with 4 threads. -After merge step 1: tpop: 8.19e-08 s ~Mflops: 1172.207 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 12454.148x: 0.00102s -> 8.19e-08s, so taking this instance. +3 iterations (4 th.) took 0.002818s; avg 0.0009394s ( +/- 0.76/ 1.45 %); best 0.0009322s; worst 0.000953s; std dev. 9.614e-06 (taking best). +Reference operation time is 0.000932217 s (0.103 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0009322 Mflops: 0.103) +Merge (3 -> 1 leaves) took w.c.t. of 1.097e-05s, ~3.815e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) +3 iterations (4 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 97.78/129.41 %); best 3e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). +Reference operation time is 3.0005e-08 s (3199 Mflops) with 4 threads. +After merge step 1: tpop: 3e-08 s ~Mflops: 3199.469 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 31068.733x: 0.0009322s -> 3e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00346s (of which 1.693e-05s partitioning, 0s I/O); computing times: 5.96e-06s in par. loops, 1.907e-06s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.00346s, equivalent to 42247.5/3.4 new/old ops (0.007865s for 2 clones -- as 96037.8/7.7 ops, or 48018.9/3.9 ops per clone), SPEEDUP of 12454.148x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 12454.148x (0.00102s -> 8.19e-08s), will amortize in 3.4 ops by saving 0.00102s per op. -In 1 tuning rounds (tot. 0.012s, 0.0079s for constructor, 2 clones) obtained a SPEEDUP of 1245314.8% (1.245e+04x) (from 0.09412 to 1172 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002835s (of which 1.502e-05s partitioning, 0s I/O); computing times: 3.815e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) +Total merge + benchmarking process took 0.002835s, equivalent to 94485.5/3.0 new/old ops (0.005564s for 2 clones -- as 185435.0/6.0 ops, or 92717.5/3.0 ops per clone), SPEEDUP of 31068.733x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 31068.733x (0.0009322s -> 3e-08s), will amortize in 3.0 ops by saving 0.0009322s per op. +In 1 tuning rounds (tot. 0.0085s, 0.0056s for constructor, 2 clones) obtained a SPEEDUP of 3106773.3% (3.107e+04x) (from 0.103 to 3199 Mflops). #pr: updating sample at index 5 (1^th of 8), 0^th touch for (0,1,0,0,0,0,0). -First run of RSB Autotuner took 0.011673 s (1.020e-03 s -> 8.190e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00847101 s (9.322e-04 s -> 3.000e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0541821 s and estimated a speedup of 1.000000 x (8.190e-08 s -> 8.190e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0496869 s and estimated a speedup of 1.000000 x (3.000e-08 s -> 3.000e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002670 0.002431 0.005101 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.005101 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002670 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002431 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002693 0.001865 0.004558 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004558 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002693 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.001865 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.005101 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004558 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.82 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.82 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.60 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 1.05 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.60 1.05 0.82 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.08 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.08 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.90 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 1.35 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.90 1.35 1.08 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -3530,56 +3566,56 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 0.00665212 1e+09 1e+09 +%operation:A.mtx 0.00739598 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 0 0.00161099 0 0.00255394 +%constructor:A.mtx 0 0.0024302 0 0.00250888 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,2) -- now using nrhs 2. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.005s): (3 x 3)[0xaaaafa567840]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.005s): (3 x 3)[0xaaaaf8a73880]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 0.002381s; avg 0.0007937s ( +/- 0.96/ 1.80 %); best 0.0007861s; worst 0.000808s; std dev. 1.012e-05 (taking best). -Reference operation time is 0.000786066 s (0.2443 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0007861 Mflops: 0.244) -Merge (3 -> 1 leaves) took w.c.t. of 1.216e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (1 th.) took 9.298e-05s; avg 3.099e-05s ( +/- 99.74/200.00 %); best 8.19e-08s; worst 9.298e-05s; std dev. 4.383e-05 (taking best). -Reference operation time is 8.18968e-08 s (2344 Mflops) with 1 threads. -After merge step 1: tpop: 8.19e-08 s ~Mflops: 2344.414 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 9598.253x: 0.0007861s -> 8.19e-08s, so taking this instance. +3 iterations (1 th.) took 0.002457s; avg 0.000819s ( +/- 8.94/ 17.35 %); best 0.0007458s; worst 0.0009611s; std dev. 0.0001005 (taking best). +Reference operation time is 0.000745773 s (0.2575 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0007458 Mflops: 0.257) +Merge (3 -> 1 leaves) took w.c.t. of 8.106e-06s, ~2.861e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) +3 iterations (1 th.) took 9.203e-05s; avg 3.068e-05s ( +/- 99.90/200.00 %); best 3e-08s; worst 9.203e-05s; std dev. 4.338e-05 (taking best). +Reference operation time is 3.0005e-08 s (6399 Mflops) with 1 threads. +After merge step 1: tpop: 3e-08 s ~Mflops: 6398.938 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 24854.986x: 0.0007458s -> 3e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002328s (of which 1.502e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.002328s, equivalent to 28427.9/3.0 new/old ops (0.004899s for 2 clones -- as 59822.4/6.2 ops, or 29911.2/3.1 ops per clone), SPEEDUP of 9598.253x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 9598.253x (0.0007861s -> 8.19e-08s), will amortize in 3.0 ops by saving 0.000786s per op. -In 1 tuning rounds (tot. 0.0074s, 0.0049s for constructor, 2 clones) obtained a SPEEDUP of 959725.3% (9598x) (from 0.2443 to 2344 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002652s (of which 1.097e-05s partitioning, 0s I/O); computing times: 2.861e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) +Total merge + benchmarking process took 0.002652s, equivalent to 88383.0/3.6 new/old ops (0.004933s for 2 clones -- as 164402.1/6.6 ops, or 82201.0/3.3 ops per clone), SPEEDUP of 24854.986x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 24854.986x (0.0007458s -> 3e-08s), will amortize in 3.6 ops by saving 0.0007457s per op. +In 1 tuning rounds (tot. 0.0075s, 0.0049s for constructor, 2 clones) obtained a SPEEDUP of 2485398.6% (2.485e+04x) (from 0.2575 to 6399 Mflops). #pr: updating sample at index 3 (2^th of 8), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.00744605 s (7.861e-04 s -> 8.190e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00754595 s (7.458e-04 s -> 3.000e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.040257 s and estimated a speedup of 1.000000 x (8.190e-08 s -> 8.190e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.033572 s and estimated a speedup of 1.000000 x (3.000e-08 s -> 3.000e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000001 0.001287 0.001806 0.003093 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.003094 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.001287 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.001806 -%:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000001 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 1.000 -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.003093 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.001784 0.001576 0.003360 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.003360 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.001784 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.001576 +%:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 nan +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.003360 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:RSB_SUBDIVISION_SCALING:A.mtx S N 1 3 3 6 1.00 %:RSB_SHUFFLE_SCALING:A.mtx S N 1 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 1 3 3 6 1.00 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:A.mtx S N 1 3 3 6 nan 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 1 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 1 3 3 6 28 48 36 @@ -3588,47 +3624,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.005s): (3 x 3)[0xaaaafa567840]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.004s): (3 x 3)[0xaaaaf8a73880]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.001911s; avg 0.000637s ( +/- 0.17/ 0.16 %); best 0.0006359s; worst 0.000638s; std dev. 8.778e-07 (taking best). -Reference operation time is 0.000635862 s (0.302 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0006359 Mflops: 0.302) -Merge (3 -> 1 leaves) took w.c.t. of 7.153e-06s, ~3.099e-06s of computing time (of which 0s sorting, 1.192e-06s analysis) -3 iterations (4 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 93.94/129.41 %); best 8.19e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). -Reference operation time is 8.18968e-08 s (2344 Mflops) with 4 threads. -After merge step 1: tpop: 8.19e-08 s ~Mflops: 2344.414 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 7764.192x: 0.0006359s -> 8.19e-08s, so taking this instance. +3 iterations (4 th.) took 0.001864s; avg 0.0006213s ( +/- 5.53/ 2.84 %); best 0.000587s; worst 0.000639s; std dev. 2.428e-05 (taking best). +Reference operation time is 0.000586987 s (0.3271 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000587 Mflops: 0.327) +Merge (3 -> 1 leaves) took w.c.t. of 1.001e-05s, ~3.099e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) +3 iterations (4 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 97.78/129.41 %); best 3e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). +Reference operation time is 3.0005e-08 s (6399 Mflops) with 4 threads. +After merge step 1: tpop: 3e-08 s ~Mflops: 6398.938 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 19562.972x: 0.000587s -> 3e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001942s (of which 1.001e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 0.001942s, equivalent to 23714.7/3.1 new/old ops (0.003825s for 2 clones -- as 46704.5/6.0 ops, or 23352.3/3.0 ops per clone), SPEEDUP of 7764.192x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 7764.192x (0.0006359s -> 8.19e-08s), will amortize in 3.1 ops by saving 0.0006358s per op. -In 1 tuning rounds (tot. 0.0058s, 0.0038s for constructor, 2 clones) obtained a SPEEDUP of 776319.2% (7764x) (from 0.302 to 2344 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001847s (of which 1.311e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 9.537e-07s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.001847s, equivalent to 61557.4/3.1 new/old ops (0.003571s for 2 clones -- as 119014.7/6.1 ops, or 59507.4/3.0 ops per clone), SPEEDUP of 19562.972x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 19562.972x (0.000587s -> 3e-08s), will amortize in 3.1 ops by saving 0.000587s per op. +In 1 tuning rounds (tot. 0.0055s, 0.0036s for constructor, 2 clones) obtained a SPEEDUP of 1956197.2% (1.956e+04x) (from 0.3271 to 6399 Mflops). #pr: updating sample at index 7 (3^th of 8), 0^th touch for (0,1,0,0,1,0,0). -First run of RSB Autotuner took 0.005795 s (6.359e-04 s -> 8.190e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00549793 s (5.870e-04 s -> 3.000e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0330939 s and estimated a speedup of 1.000000 x (8.190e-08 s -> 8.190e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0287342 s and estimated a speedup of 1.000000 x (3.000e-08 s -> 3.000e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002324 0.001692 0.004016 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004016 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002324 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.001692 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.000902 0.001660 0.002562 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.002562 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.000902 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.001660 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 inf -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004016 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.002562 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.77 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.77 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.55 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 1.07 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 inf 0.55 1.07 0.77 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.31 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.31 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 1.98 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.95 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 1.98 0.95 1.31 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -3637,37 +3673,37 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 0.00478292 1e+09 1e+09 +%operation:A.mtx 0.00501084 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 1.19209e-06 0.00128698 0 0.00180602 +%constructor:A.mtx 0 0.00178385 0 0.00157619 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.650s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.217s/0.000s . +# so far, program took 5.594s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.206s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.08897s (system CPU time used) -ru_utime : 7.037s (user CPU time used) +ru_stime : 0.06474s (system CPU time used) +ru_utime : 7.444s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1172.21 1.222e-03 0.000e+00 8.190e-08 0.000e+00 1.099e-02 3.27e+00 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1172.21 1.020e-03 0.000e+00 8.190e-08 0.000e+00 1.167e-02 3.27e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 1.214e-03 0.000e+00 9.537e-07 0.000e+00 1.096e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 3199.47 9.322e-04 0.000e+00 3.000e-08 0.000e+00 8.471e-03 8.93e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 1368604.5 % faster, avg. sp. ratio 13687.045x, max sp. ratio 14919.942x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 138368.3/134203.8/142532.8/276736.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.2/ 9.0/ 11.4/ 20.4 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.2, min. 9.0, max. 11.4 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1616974.1 % faster, avg. sp. ratio 16170.741x, max sp. ratio 31068.733x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 146905.2/11490.2/282320.2/293810.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.1/ 9.0/ 9.1/ 18.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.1, min. 9.0, max. 9.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.686/ 2.686/ 2.686,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.545/ 3.272/ 3.272,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.781/ 0.231/ 7.332,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.213/ 0.281/ 8.932,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) @@ -3675,32 +3711,32 @@ #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) #pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) #pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.172e+03, min 1.172e+03, max 1.172e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 8.634e-02, min 7.857e-02, max 9.412e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 8.190e-08s, min 8.190e-08s, max 8.190e-08s, tot 1.638e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.121e-03s, min 1.020e-03s, max 1.222e-03s, tot 2.242e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.743e+01 1.743e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.016e+00 +#pr: best tun. rsb canon. mflops were: on avg. 1.650e+03, min 1.007e+02, max 3.199e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 9.104e-02, min 7.909e-02, max 1.030e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 4.918e-07s, min 3.000e-08s, max 9.537e-07s, tot 9.837e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.073e-03s, min 9.322e-04s, max 1.214e-03s, tot 2.146e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 6.513e+00 2.070e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.987e-01 #pr: ======== Limiting to nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2344.41 7.861e-04 0.000e+00 8.190e-08 0.000e+00 7.446e-03 5.03e+00 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2344.41 6.359e-04 0.000e+00 8.190e-08 0.000e+00 5.795e-03 5.03e+00 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 6398.94 7.458e-04 0.000e+00 3.000e-08 0.000e+00 7.546e-03 1.37e+01 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 6398.94 5.870e-04 0.000e+00 3.000e-08 0.000e+00 5.498e-03 1.37e+01 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 868022.3 % faster, avg. sp. ratio 8681.223x, max sp. ratio 9598.253x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 80839.9/70759.8/90919.9/161679.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.3/ 9.1/ 9.5/ 18.6 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.3, min. 9.1, max. 9.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 2220797.9 % faster, avg. sp. ratio 22208.979x, max sp. ratio 24854.986x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 217361.9/183234.0/251489.9/434723.9 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.7/ 9.4/ 10.1/ 19.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.7, min. 9.4, max. 10.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.859/ 3.859/ 3.859,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.061/ 5.031/ 5.031,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 10.532/ 10.532/ 10.532,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 27.462/ 13.731/ 13.731,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) @@ -3708,67 +3744,67 @@ #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) #pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) #pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.344e+03, min 2.344e+03, max 2.344e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.731e-01, min 2.443e-01, max 3.020e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 8.190e-08s, min 8.190e-08s, max 8.190e-08s, tot 1.638e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.110e-04s, min 6.359e-04s, max 7.861e-04s, tot 1.422e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.213e+01 1.213e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.016e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: best tun. rsb canon. mflops were: on avg. 6.399e+03, min 6.399e+03, max 6.399e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.923e-01, min 2.575e-01, max 3.271e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 3.000e-08s, min 3.000e-08s, max 3.000e-08s, tot 6.001e-08s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.664e-04s, min 5.870e-04s, max 7.458e-04s, tot 1.333e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.534e+00 4.534e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.987e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.278e+01 x, min 2.000e+00 x, max 6.357e+01 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1172.21 1.222e-03 0.000e+00 8.190e-08 0.000e+00 1.099e-02 3.27e+00 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2344.41 7.861e-04 0.000e+00 8.190e-08 0.000e+00 7.446e-03 5.03e+00 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1172.21 1.020e-03 0.000e+00 8.190e-08 0.000e+00 1.167e-02 3.27e+00 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2344.41 6.359e-04 0.000e+00 8.190e-08 0.000e+00 5.795e-03 5.03e+00 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 1.214e-03 0.000e+00 9.537e-07 0.000e+00 1.096e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 6398.94 7.458e-04 0.000e+00 3.000e-08 0.000e+00 7.546e-03 1.37e+01 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 3199.47 9.322e-04 0.000e+00 3.000e-08 0.000e+00 8.471e-03 8.93e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 6398.94 5.870e-04 0.000e+00 3.000e-08 0.000e+00 5.498e-03 1.37e+01 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 1118313.4 % faster, avg. sp. ratio 11184.134x, max sp. ratio 14919.942x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 109604.1/70759.8/142532.8/438416.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.8/ 9.0/ 11.4/ 39.0 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.8, min. 9.0, max. 11.4 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1918886.0 % faster, avg. sp. ratio 19189.860x, max sp. ratio 31068.733x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 182133.6/11490.2/282320.2/728534.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.4/ 9.0/ 10.1/ 37.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.4, min. 9.0, max. 10.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.272/ 2.686/ 3.859,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.606/ 3.272/ 5.031,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 7.156/ 0.231/ 10.532,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 36.675/ 0.281/ 13.731,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.04 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.04 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.758e+03, min 1.172e+03, max 2.344e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.797e-01, min 7.857e-02, max 3.020e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 8.190e-08s, min 8.190e-08s, max 8.190e-08s, tot 3.276e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 9.159e-04s, min 6.359e-04s, max 1.222e-03s, tot 3.664e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.213e+01 1.743e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.016e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.025e+03, min 1.007e+02, max 6.399e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.917e-01, min 7.909e-02, max 3.271e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 2.609e-07s, min 3.000e-08s, max 9.537e-07s, tot 1.044e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.697e-04s, min 5.870e-04s, max 1.214e-03s, tot 3.479e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.534e+00 2.070e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.987e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.278e+01 x, min 2.000e+00 x, max 6.357e+01 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1172.21 1.222e-03 0.000e+00 8.190e-08 0.000e+00 1.099e-02 3.27e+00 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1172.21 1.020e-03 0.000e+00 8.190e-08 0.000e+00 1.167e-02 3.27e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 1.214e-03 0.000e+00 9.537e-07 0.000e+00 1.096e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 3199.47 9.322e-04 0.000e+00 3.000e-08 0.000e+00 8.471e-03 8.93e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 1368604.5 % faster, avg. sp. ratio 13687.045x, max sp. ratio 14919.942x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 138368.3/134203.8/142532.8/276736.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.2/ 9.0/ 11.4/ 20.4 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.2, min. 9.0, max. 11.4 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1616974.1 % faster, avg. sp. ratio 16170.741x, max sp. ratio 31068.733x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 146905.2/11490.2/282320.2/293810.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.1/ 9.0/ 9.1/ 18.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.1, min. 9.0, max. 9.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.686/ 2.686/ 2.686,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.545/ 3.272/ 3.272,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.781/ 0.231/ 7.332,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.213/ 0.281/ 8.932,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) @@ -3776,32 +3812,32 @@ #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) #pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) #pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.172e+03, min 1.172e+03, max 1.172e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 8.634e-02, min 7.857e-02, max 9.412e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 8.190e-08s, min 8.190e-08s, max 8.190e-08s, tot 1.638e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.121e-03s, min 1.020e-03s, max 1.222e-03s, tot 2.242e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.743e+01 1.743e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.016e+00 +#pr: best tun. rsb canon. mflops were: on avg. 1.650e+03, min 1.007e+02, max 3.199e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 9.104e-02, min 7.909e-02, max 1.030e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 4.918e-07s, min 3.000e-08s, max 9.537e-07s, tot 9.837e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.073e-03s, min 9.322e-04s, max 1.214e-03s, tot 2.146e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 6.513e+00 2.070e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.987e-01 #pr: ======== Limiting to both transA=N and nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2344.41 7.861e-04 0.000e+00 8.190e-08 0.000e+00 7.446e-03 5.03e+00 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2344.41 6.359e-04 0.000e+00 8.190e-08 0.000e+00 5.795e-03 5.03e+00 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 6398.94 7.458e-04 0.000e+00 3.000e-08 0.000e+00 7.546e-03 1.37e+01 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 6398.94 5.870e-04 0.000e+00 3.000e-08 0.000e+00 5.498e-03 1.37e+01 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 868022.3 % faster, avg. sp. ratio 8681.223x, max sp. ratio 9598.253x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 80839.9/70759.8/90919.9/161679.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.3/ 9.1/ 9.5/ 18.6 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.3, min. 9.1, max. 9.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 2220797.9 % faster, avg. sp. ratio 22208.979x, max sp. ratio 24854.986x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 217361.9/183234.0/251489.9/434723.9 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.7/ 9.4/ 10.1/ 19.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.7, min. 9.4, max. 10.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.859/ 3.859/ 3.859,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.061/ 5.031/ 5.031,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 10.532/ 10.532/ 10.532,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 27.462/ 13.731/ 13.731,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) @@ -3809,13 +3845,13 @@ #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) #pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) #pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.344e+03, min 2.344e+03, max 2.344e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.731e-01, min 2.443e-01, max 3.020e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 8.190e-08s, min 8.190e-08s, max 8.190e-08s, tot 1.638e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.110e-04s, min 6.359e-04s, max 7.861e-04s, tot 1.422e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.213e+01 1.213e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.016e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: best tun. rsb canon. mflops were: on avg. 6.399e+03, min 6.399e+03, max 6.399e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.923e-01, min 2.575e-01, max 3.271e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 3.000e-08s, min 3.000e-08s, max 3.000e-08s, tot 6.001e-08s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.664e-04s, min 5.870e-04s, max 7.458e-04s, tot 1.333e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.534e+00 4.534e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.987e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.278e+01 x, min 2.000e+00 x, max 6.357e+01 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 4) matched the dump criteria -- skipping dump round. #pr: ======== Limiting to both transA=T and nrhs=1: @@ -3825,44 +3861,44 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1172.21 1.222e-03 0.000e+00 8.190e-08 0.000e+00 1.099e-02 3.27e+00 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2344.41 7.861e-04 0.000e+00 8.190e-08 0.000e+00 7.446e-03 5.03e+00 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1172.21 1.020e-03 0.000e+00 8.190e-08 0.000e+00 1.167e-02 3.27e+00 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2344.41 6.359e-04 0.000e+00 8.190e-08 0.000e+00 5.795e-03 5.03e+00 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 1.214e-03 0.000e+00 9.537e-07 0.000e+00 1.096e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 6398.94 7.458e-04 0.000e+00 3.000e-08 0.000e+00 7.546e-03 1.37e+01 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 3199.47 9.322e-04 0.000e+00 3.000e-08 0.000e+00 8.471e-03 8.93e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 6398.94 5.870e-04 0.000e+00 3.000e-08 0.000e+00 5.498e-03 1.37e+01 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 1118313.4 % faster, avg. sp. ratio 11184.134x, max sp. ratio 14919.942x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 109604.1/70759.8/142532.8/438416.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.8/ 9.0/ 11.4/ 39.0 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.8, min. 9.0, max. 11.4 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1918886.0 % faster, avg. sp. ratio 19189.860x, max sp. ratio 31068.733x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 182133.6/11490.2/282320.2/728534.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.4/ 9.0/ 10.1/ 37.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.4, min. 9.0, max. 10.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.272/ 2.686/ 3.859,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.606/ 3.272/ 5.031,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 7.156/ 0.231/ 10.532,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 36.675/ 0.281/ 13.731,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.04 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.04 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.758e+03, min 1.172e+03, max 2.344e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.797e-01, min 7.857e-02, max 3.020e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 8.190e-08s, min 8.190e-08s, max 8.190e-08s, tot 3.276e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 9.159e-04s, min 6.359e-04s, max 1.222e-03s, tot 3.664e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.213e+01 1.743e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.016e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) -#pr: Record collection took 0.23 s. +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.025e+03, min 1.007e+02, max 6.399e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.917e-01, min 7.909e-02, max 3.271e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 2.609e-07s, min 3.000e-08s, max 9.537e-07s, tot 1.044e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.697e-04s, min 5.870e-04s, max 1.214e-03s, tot 3.479e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.534e+00 2.070e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.987e-01 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 3.278e+01 x, min 2.000e+00 x, max 6.357e+01 x (2 samples, the non-min-nrhs ones) +#pr: Record collection took 0.22 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 105 environment variables in 5773 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 105 environment variables in 5827 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1796064017_gcc-15.2-1,4th.rpr -# Removing the temporary record file rsbench_pr__1796064017_gcc-15.2-1,4th.rpr.tmp. -# terminating run at 1796064023 (after 5.6s of w.c.t.) +#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1761654533_gcc-15.2-1,4th.rpr +# Removing the temporary record file rsbench_pr__1761654533_gcc-15.2-1,4th.rpr.tmp. +# terminating run at 1761654539 (after 5.6s of w.c.t.) + ./rsbench -oa -Ob --help /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench is a swiss army knife for testing the library functionality and performance. You can use it to perform sparse matrix - unitary vector multiplication, specifying the blocking parameters, the times to perform multiplication. @@ -4134,10 +4170,10 @@ L1 size: 24576 L2 size: 524288 sysconf() : 4096 bytes per pagesize -sysconf() : 8202356 physical pages -sysconf() : 33596850176 bytes (32040 MB) of physical memory -sysconf() : 5521315 available (free) physical pages -sysconf() : 22615306240 available (free) physical memory +sysconf() : 8202357 physical pages +sysconf() : 33596854272 bytes (32040 MB) of physical memory +sysconf() : 4325581 available (free) physical pages +sysconf() : 17717579776 available (free) physical memory sysconf() , processors : 12 sysconf() , processors online : 12 sysconf() : no level 1 cache @@ -4162,30 +4198,30 @@ RSB_SUBM_IDX_MARKER : 2147483647 RSB_MAX_ALLOCATABLE_MEMORY_CHUNK: 18446744073709551615 timing min delta (if negative, don't complain with us) : 0 s -timing granularity : 2.99931e-08 s +timing granularity : 3.19958e-08 s CFLAGS : -g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 CXXFLAGS : -g -O2 -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp CC : gcc memhinfo : L2:4/64/512K,L1:8/64/24K -detected free memory : 22615306240 -detected total memory : 33596850176 -for array sized 524288 elems, took 0.000108957 s for linear search and 0 s for binary search for element 524287, in 901 tries, for a total of 0.100077 s (ignore this:944765174) -for array sized 524288 elems, took 5.48363e-05 s for linear search and 0 s for binary search for element 262143, in 1798 tries, for a total of 0.100019 s (ignore this:1887431402) -for array sized 524288 elems, took 2.69413e-05 s for linear search and 0 s for binary search for element 131071, in 3564 tries, for a total of 0.100008 s (ignore this:-1473261806) -for array sized 524288 elems, took 1.28746e-05 s for linear search and 0 s for binary search for element 65535, in 7202 tries, for a total of 0.100006 s (ignore this:-529295666) -for array sized 524288 elems, took 5.96046e-06 s for linear search and 0 s for binary search for element 32767, in 14293 tries, for a total of 0.100006 s (ignore this:407381796) -for array sized 524288 elems, took 2.86102e-06 s for linear search and 0 s for binary search for element 16383, in 28149 tries, for a total of 0.100000 s (ignore this:1329711930) -for array sized 524288 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 8191, in 55241 tries, for a total of 0.100002 s (ignore this:-2060297304) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 4095, in 104646 tries, for a total of 0.100001 s (ignore this:-1203246564) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 2047, in 189347 tries, for a total of 0.100001 s (ignore this:-428059946) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 1023, in 327456 tries, for a total of 0.100000 s (ignore this:241915030) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 511, in 505296 tries, for a total of 0.100001 s (ignore this:758327542) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 255, in 692839 tries, for a total of 0.100000 s (ignore this:1111675432) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 127, in 848057 tries, for a total of 0.100001 s (ignore this:1327081910) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 63, in 964220 tries, for a total of 0.100000 s (ignore this:1448573630) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 31, in 1016058 tries, for a total of 0.100000 s (ignore this:1511569226) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 15, in 1054705 tries, for a total of 0.100000 s (ignore this:1543210376) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 7, in 1069826 tries, for a total of 0.100001 s (ignore this:1558187940) +detected free memory : 17717579776 +detected total memory : 33596854272 +for array sized 524288 elems, took 0.000108957 s for linear search and 0 s for binary search for element 524287, in 855 tries, for a total of 0.100094 s (ignore this:896530770) +for array sized 524288 elems, took 5.48363e-05 s for linear search and 0 s for binary search for element 262143, in 1811 tries, for a total of 0.100038 s (ignore this:1846012716) +for array sized 524288 elems, took 2.69413e-05 s for linear search and 0 s for binary search for element 131071, in 3578 tries, for a total of 0.100006 s (ignore this:-1511010504) +for array sized 524288 elems, took 1.28746e-05 s for linear search and 0 s for binary search for element 65535, in 7203 tries, for a total of 0.100010 s (ignore this:-566913294) +for array sized 524288 elems, took 5.96046e-06 s for linear search and 0 s for binary search for element 32767, in 14294 tries, for a total of 0.100000 s (ignore this:369829702) +for array sized 524288 elems, took 2.86102e-06 s for linear search and 0 s for binary search for element 16383, in 28000 tries, for a total of 0.100000 s (ignore this:1287277702) +for array sized 524288 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 8191, in 55241 tries, for a total of 0.100000 s (ignore this:-2102731532) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 4095, in 104512 tries, for a total of 0.100001 s (ignore this:-1246778252) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 2047, in 189446 tries, for a total of 0.100001 s (ignore this:-471186328) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 1023, in 326625 tries, for a total of 0.100001 s (ignore this:197088422) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 511, in 505004 tries, for a total of 0.100001 s (ignore this:713202510) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 255, in 692951 tries, for a total of 0.100000 s (ignore this:1066607520) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 127, in 850825 tries, for a total of 0.100000 s (ignore this:1282717070) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 63, in 959805 tries, for a total of 0.100001 s (ignore this:1403652500) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 31, in 1024397 tries, for a total of 0.100000 s (ignore this:1467165114) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 15, in 1039795 tries, for a total of 0.100001 s (ignore this:1498358964) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 7, in 1051989 tries, for a total of 0.100001 s (ignore this:1513086810) + ./rsbench -C /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench version: 1.3.0 format switches:br @@ -4232,17 +4268,17 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1796064025 +# beginning run at 1761654541 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx --verbose --nrhs 1,4 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 # User did not specify threads; assuming 1. Environment provides max 12 threads; this build supports max 128. # User did not specify threads; assuming 1. Environment provides max 12 threads; this build supports max 128. -# average timer granularity: 7.78e-08 s -# Will write a final performance record to file rsbench_pr__1796064025_gcc-15.2.rpr and periodic checkpoints to rsbench_pr__1796064025_gcc-15.2.rpr.tmp +# average timer granularity: 7.62e-08 s +# Will write a final performance record to file rsbench_pr__1761654541_gcc-15.2.rpr and periodic checkpoints to rsbench_pr__1761654541_gcc-15.2.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -4281,61 +4317,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 5.371s +# Memory benchmark took 5.396s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 16 samples (4480 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.375s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.399s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type D... -# file input of A.mtx took 0.00 s (6 nnz, 75801 nnz/s ) (2.32 MB/s ) -#pre-sorting (6 elements) took 0.00384307 s +# file input of A.mtx took 0.00 s (6 nnz, 72316 nnz/s ) (2.22 MB/s ) +#pre-sorting (6 elements) took 0.00211406 s #weeding duplicates (to 6 elements) took 2.14577e-06 s (and check, 1.90735e-06 s ) # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.010s): (3 x 3)[0xaaaaf1f38010]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.008s): (3 x 3)[0xaaaaeb9d6050]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.003832s; avg 0.001277s ( +/- 6.52/ 12.26 %); best 0.001194s; worst 0.001434s; std dev. 0.0001108 (taking best). -Reference operation time is 0.001194 s (0.0201 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001194 Mflops: 0.020) -Merge (3 -> 1 leaves) took w.c.t. of 1.812e-05s, ~7.153e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 1.884e-05s; avg 6.278e-06s ( +/- 98.78/184.81 %); best 7.645e-08s; worst 1.788e-05s; std dev. 8.214e-06 (taking best). -Reference operation time is 7.64489e-08 s (313.9 Mflops) with 12 threads. -After merge step 1: tpop: 7.645e-08 s ~Mflops: 313.935 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 15618.275x: 0.001194s -> 7.645e-08s, so taking this instance. +3 iterations (12 th.) took 0.003797s; avg 0.001266s ( +/- 1.80/ 2.08 %); best 0.001243s; worst 0.001292s; std dev. 2.022e-05 (taking best). +Reference operation time is 0.00124288 s (0.01931 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001243 Mflops: 0.019) +Merge (3 -> 1 leaves) took w.c.t. of 2.885e-05s, ~1.097e-05s of computing time (of which 1.907e-06s sorting, 5.96e-06s analysis) +3 iterations (12 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 99.25/190.77 %); best 7.734e-08s; worst 3.004e-05s; std dev. 1.394e-05 (taking best). +Reference operation time is 7.7343e-08 s (310.3 Mflops) with 12 threads. +After merge step 1: tpop: 7.734e-08 s ~Mflops: 310.306 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 16069.667x: 0.001243s -> 7.734e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.004065s (of which 2.193e-05s partitioning, 0s I/O); computing times: 7.153e-06s in par. loops, 9.537e-07s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.004065s, equivalent to 53173.2/3.4 new/old ops (0.007203s for 2 clones -- as 94218.0/6.0 ops, or 47109.0/3.0 ops per clone), SPEEDUP of 15618.275x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 15618.275x (0.001194s -> 7.645e-08s), will amortize in 3.4 ops by saving 0.001194s per op. -In 1 tuning rounds (tot. 0.012s, 0.0072s for constructor, 2 clones) obtained a SPEEDUP of 1561727.5% (1.562e+04x) (from 0.0201 to 313.9 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003765s (of which 3.386e-05s partitioning, 0s I/O); computing times: 1.097e-05s in par. loops, 1.907e-06s sorting, 5.96e-06s analyzing) +Total merge + benchmarking process took 0.003765s, equivalent to 48677.6/3.0 new/old ops (0.006929s for 2 clones -- as 89583.8/5.6 ops, or 44791.9/2.8 ops per clone), SPEEDUP of 16069.667x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 16069.667x (0.001243s -> 7.734e-08s), will amortize in 3.0 ops by saving 0.001243s per op. +In 1 tuning rounds (tot. 0.011s, 0.0069s for constructor, 2 clones) obtained a SPEEDUP of 1606866.7% (1.607e+04x) (from 0.01931 to 310.3 Mflops). #pr: updating sample at index 1 (0^th of 16), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.0115621 s (1.194e-03 s -> 7.645e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0109081 s (1.243e-03 s -> 7.734e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0614598 s and estimated a speedup of 1.000000 x (7.645e-08 s -> 7.645e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0581801 s and estimated a speedup of 1.000000 x (7.734e-08 s -> 7.734e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.004799 0.002393 0.007192 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.007192 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.004799 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.002393 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.003012 0.002495 0.005507 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.005507 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.003012 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.002495 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.007192 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.005507 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4350,50 +4386,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.0100031 1e+09 1e+09 +%operation:A.mtx 0.00794697 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00479913 0 0.00239301 +%constructor:A.mtx 0 0.00301218 0 0.00249505 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.005s): (3 x 3)[0xaaaaf1f38010]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.006s): (3 x 3)[0xaaaaeb9d6050]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.004941s; avg 0.001647s ( +/- 19.12/ 30.24 %); best 0.001332s; worst 0.002145s; std dev. 0.0003563 (taking best). -Reference operation time is 0.00133204 s (0.07207 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001332 Mflops: 0.072) -Merge (3 -> 1 leaves) took w.c.t. of 1.311e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 3.815e-06s; avg 1.272e-06s ( +/- 93.99/125.00 %); best 7.645e-08s; worst 2.861e-06s; std dev. 1.189e-06 (taking best). -Reference operation time is 7.64489e-08 s (1256 Mflops) with 12 threads. -After merge step 1: tpop: 7.645e-08 s ~Mflops: 1255.740 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 17423.983x: 0.001332s -> 7.645e-08s, so taking this instance. +3 iterations (12 th.) took 0.002872s; avg 0.0009573s ( +/- 0.78/ 1.34 %); best 0.0009499s; worst 0.0009701s; std dev. 9.09e-06 (taking best). +Reference operation time is 0.00094986 s (0.1011 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0009499 Mflops: 0.101) +Merge (3 -> 1 leaves) took w.c.t. of 8.821e-06s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 94.28/129.41 %); best 7.734e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). +Reference operation time is 7.7343e-08 s (1241 Mflops) with 12 threads. +After merge step 1: tpop: 7.734e-08 s ~Mflops: 1241.224 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 12281.134x: 0.0009499s -> 7.734e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.004245s (of which 1.597e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.004245s, equivalent to 55527.8/3.2 new/old ops (0.006499s for 2 clones -- as 85008.6/4.9 ops, or 42504.3/2.4 ops per clone), SPEEDUP of 17423.983x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 17423.983x (0.001332s -> 7.645e-08s), will amortize in 3.2 ops by saving 0.001332s per op. -In 1 tuning rounds (tot. 0.012s, 0.0065s for constructor, 2 clones) obtained a SPEEDUP of 1742298.3% (1.742e+04x) (from 0.07207 to 1256 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002884s (of which 1.287e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) +Total merge + benchmarking process took 0.002884s, equivalent to 37290.4/3.0 new/old ops (0.00573s for 2 clones -- as 74084.5/6.0 ops, or 37042.2/3.0 ops per clone), SPEEDUP of 12281.134x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 12281.134x (0.0009499s -> 7.734e-08s), will amortize in 3.0 ops by saving 0.0009498s per op. +In 1 tuning rounds (tot. 0.0087s, 0.0057s for constructor, 2 clones) obtained a SPEEDUP of 1228013.4% (1.228e+04x) (from 0.1011 to 1241 Mflops). #pr: updating sample at index 9 (1^th of 16), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.0115209 s (1.332e-03 s -> 7.645e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00868106 s (9.499e-04 s -> 7.734e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0422771 s and estimated a speedup of 1.000000 x (7.645e-08 s -> 7.645e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0428119 s and estimated a speedup of 1.000000 x (7.734e-08 s -> 7.734e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.002017 0.001609 0.003626 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003626 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002017 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001609 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.002007 0.001942 0.003949 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003949 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002007 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001942 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003626 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003949 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4408,65 +4444,65 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00519109 1e+09 1e+09 +%operation:A.mtx 0.00587702 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00201702 0 0.00160885 +%constructor:A.mtx 0 0.00200677 0 0.00194216 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.531s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.127s/0.000s . +# so far, program took 5.546s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.121s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.06725s (system CPU time used) -ru_utime : 6.405s (user CPU time used) +ru_stime : 0.05187s (system CPU time used) +ru_utime : 6.681s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.531s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.127s/0.000s . +# so far, program took 5.546s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.121s/0.000s . # Reusing type converted (D->S) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.005s): (3 x 3)[0xaaaaf1f38010]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.004s): (3 x 3)[0xaaaaeb9d6050]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.002247s; avg 0.000749s ( +/- 28.98/ 25.11 %); best 0.0005319s; worst 0.000937s; std dev. 0.0001666 (taking best). -Reference operation time is 0.000531912 s (0.04512 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0005319 Mflops: 0.045) -Merge (3 -> 1 leaves) took w.c.t. of 8.821e-06s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 0.000102s; avg 3.401e-05s ( +/- 99.78/196.50 %); best 7.645e-08s; worst 0.0001009s; std dev. 4.726e-05 (taking best). -Reference operation time is 7.64489e-08 s (313.9 Mflops) with 12 threads. -After merge step 1: tpop: 7.645e-08 s ~Mflops: 313.935 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 6957.742x: 0.0005319s -> 7.645e-08s, so taking this instance. +3 iterations (12 th.) took 0.001518s; avg 0.000506s ( +/- 30.41/ 17.56 %); best 0.0003521s; worst 0.0005949s; std dev. 0.0001092 (taking best). +Reference operation time is 0.000352144 s (0.06815 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0003521 Mflops: 0.068) +Merge (3 -> 1 leaves) took w.c.t. of 9.06e-06s, ~4.053e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 0.0001001s; avg 3.338e-05s ( +/- 99.77/200.00 %); best 7.734e-08s; worst 0.0001001s; std dev. 4.72e-05 (taking best). +Reference operation time is 7.7343e-08 s (310.3 Mflops) with 12 threads. +After merge step 1: tpop: 7.734e-08 s ~Mflops: 310.306 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 4553.021x: 0.0003521s -> 7.734e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001659s (of which 1.097e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001659s, equivalent to 21699.7/3.1 new/old ops (0.003889s for 2 clones -- as 50871.7/7.3 ops, or 25435.8/3.7 ops per clone), SPEEDUP of 6957.742x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 6957.742x (0.0005319s -> 7.645e-08s), will amortize in 3.1 ops by saving 0.0005318s per op. -In 1 tuning rounds (tot. 0.0063s, 0.0039s for constructor, 2 clones) obtained a SPEEDUP of 695674.2% (6958x) (from 0.04512 to 313.9 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001836s (of which 1.192e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 0s sorting, 9.537e-07s analyzing) +Total merge + benchmarking process took 0.001836s, equivalent to 23736.1/5.2 new/old ops (0.00339s for 2 clones -- as 43828.6/9.6 ops, or 21914.3/4.8 ops per clone), SPEEDUP of 4553.021x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 4553.021x (0.0003521s -> 7.734e-08s), will amortize in 5.2 ops by saving 0.0003521s per op. +In 1 tuning rounds (tot. 0.0055s, 0.0034s for constructor, 2 clones) obtained a SPEEDUP of 455202.1% (4553x) (from 0.06815 to 310.3 Mflops). #pr: updating sample at index 3 (2^th of 16), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.00631285 s (5.319e-04 s -> 7.645e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00550508 s (3.521e-04 s -> 7.734e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0196929 s and estimated a speedup of 1.000000 x (7.645e-08 s -> 7.645e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0356052 s and estimated a speedup of 1.000000 x (7.734e-08 s -> 7.734e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000001 0.002210 0.001575 0.003785 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003786 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002210 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001575 -%:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000001 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 1.000 -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003785 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001495 0.001193 0.002688 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002688 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001495 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001193 +%:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002688 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:RSB_SUBDIVISION_SCALING:A.mtx S N 12 3 3 6 1.00 %:RSB_SHUFFLE_SCALING:A.mtx S N 12 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 12 3 3 6 1.00 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:A.mtx S N 12 3 3 6 nan 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 12 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 12 3 3 6 28 48 36 @@ -4475,50 +4511,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00536013 1e+09 1e+09 +%operation:A.mtx 0.00388694 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 9.53674e-07 0.0022099 0 0.00157499 +%constructor:A.mtx 0 0.00149488 0 0.00119281 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.003s): (3 x 3)[0xaaaaf1f383a0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.004s): (3 x 3)[0xaaaaeb9d63e0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.001262s; avg 0.0004206s ( +/- 1.61/ 2.47 %); best 0.0004139s; worst 0.0004311s; std dev. 7.47e-06 (taking best). -Reference operation time is 0.000413895 s (0.2319 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004139 Mflops: 0.232) -Merge (3 -> 1 leaves) took w.c.t. of 5.96e-06s, ~3.099e-06s of computing time (of which 1.192e-06s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 89.31/200.00 %); best 7.645e-08s; worst 2.146e-06s; std dev. 1.012e-06 (taking best). -Reference operation time is 7.64489e-08 s (1256 Mflops) with 12 threads. -After merge step 1: tpop: 7.645e-08 s ~Mflops: 1255.740 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5414.003x: 0.0004139s -> 7.645e-08s, so taking this instance. +3 iterations (12 th.) took 0.001794s; avg 0.000598s ( +/- 0.33/ 0.35 %); best 0.000596s; worst 0.0006001s; std dev. 1.656e-06 (taking best). +Reference operation time is 0.000596046 s (0.1611 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000596 Mflops: 0.161) +Merge (3 -> 1 leaves) took w.c.t. of 6.914e-06s, ~3.099e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 92.51/200.00 %); best 7.734e-08s; worst 3.099e-06s; std dev. 1.461e-06 (taking best). +Reference operation time is 7.7343e-08 s (1241 Mflops) with 12 threads. +After merge step 1: tpop: 7.734e-08 s ~Mflops: 1241.224 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 7706.535x: 0.000596s -> 7.734e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001408s (of which 8.821e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 1.192e-06s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001408s, equivalent to 18415.7/3.4 new/old ops (0.002432s for 2 clones -- as 31813.5/5.9 ops, or 15906.8/2.9 ops per clone), SPEEDUP of 5414.003x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5414.003x (0.0004139s -> 7.645e-08s), will amortize in 3.4 ops by saving 0.0004138s per op. -In 1 tuning rounds (tot. 0.0039s, 0.0024s for constructor, 2 clones) obtained a SPEEDUP of 541300.3% (5414x) (from 0.2319 to 1256 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00182s (of which 9.775e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 9.537e-07s analyzing) +Total merge + benchmarking process took 0.00182s, equivalent to 23529.6/3.1 new/old ops (0.003593s for 2 clones -- as 46455.0/6.0 ops, or 23227.5/3.0 ops per clone), SPEEDUP of 7706.535x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 7706.535x (0.000596s -> 7.734e-08s), will amortize in 3.1 ops by saving 0.000596s per op. +In 1 tuning rounds (tot. 0.0055s, 0.0036s for constructor, 2 clones) obtained a SPEEDUP of 770553.5% (7707x) (from 0.1611 to 1241 Mflops). #pr: updating sample at index 11 (3^th of 16), 0^th touch for (0,0,0,0,1,1,0). -First run of RSB Autotuner took 0.00392008 s (4.139e-04 s -> 7.645e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00546193 s (5.960e-04 s -> 7.734e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0268381 s and estimated a speedup of 1.000000 x (7.645e-08 s -> 7.645e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.022619 s and estimated a speedup of 1.000000 x (7.734e-08 s -> 7.734e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001029 0.000822 0.001851 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001851 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001029 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000822 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001787 0.001248 0.003035 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003035 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001787 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001248 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001851 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003035 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4533,65 +4569,65 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00267506 1e+09 1e+09 +%operation:A.mtx 0.004287 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00102901 0 0.000822067 +%constructor:A.mtx 0 0.00178695 0 0.00124788 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.603s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.184s/0.000s . +# so far, program took 5.629s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.190s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.07513s (system CPU time used) -ru_utime : 6.981s (user CPU time used) +ru_stime : 0.06061s (system CPU time used) +ru_utime : 7.405s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was S). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.603s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.184s/0.000s . +# so far, program took 5.629s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.190s/0.000s . # Reusing type converted (S->C) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.006s): (3 x 3)[0xaaaaf1f3b400]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.003s): (3 x 3)[0xaaaaeb9d9440]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.002895s; avg 0.000965s ( +/- 43.22/ 84.05 %); best 0.0005479s; worst 0.001776s; std dev. 0.0005736 (taking best). -Reference operation time is 0.000547886 s (0.1752 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0005479 Mflops: 0.175) -Merge (3 -> 1 leaves) took w.c.t. of 1.001e-05s, ~3.099e-06s of computing time (of which 1.192e-06s sorting, 1.192e-06s analysis) -3 iterations (12 th.) took 0.0001879s; avg 6.262e-05s ( +/- 99.88/198.48 %); best 7.645e-08s; worst 0.0001869s; std dev. 8.789e-05 (taking best). -Reference operation time is 7.64489e-08 s (1256 Mflops) with 12 threads. -After merge step 1: tpop: 7.645e-08 s ~Mflops: 1255.740 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 7166.693x: 0.0005479s -> 7.645e-08s, so taking this instance. +3 iterations (12 th.) took 0.001958s; avg 0.0006526s ( +/- 35.96/ 66.88 %); best 0.0004179s; worst 0.001089s; std dev. 0.0003089 (taking best). +Reference operation time is 0.000417948 s (0.2297 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004179 Mflops: 0.230) +Merge (3 -> 1 leaves) took w.c.t. of 8.106e-06s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) +3 iterations (12 th.) took 0.0002792s; avg 9.306e-05s ( +/- 99.92/200.00 %); best 7.734e-08s; worst 0.0002792s; std dev. 0.0001316 (taking best). +Reference operation time is 7.7343e-08 s (1241 Mflops) with 12 threads. +After merge step 1: tpop: 7.734e-08 s ~Mflops: 1241.224 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5403.822x: 0.0004179s -> 7.734e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001624s (of which 1.216e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 1.192e-06s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 0.001624s, equivalent to 21244.3/3.0 new/old ops (0.003772s for 2 clones -- as 49337.3/6.9 ops, or 24668.6/3.4 ops per clone), SPEEDUP of 7166.693x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 7166.693x (0.0005479s -> 7.645e-08s), will amortize in 3.0 ops by saving 0.0005478s per op. -In 1 tuning rounds (tot. 0.0069s, 0.0038s for constructor, 2 clones) obtained a SPEEDUP of 716569.3% (7167x) (from 0.1752 to 1256 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00116s (of which 1.097e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 1.192e-06s analyzing) +Total merge + benchmarking process took 0.00116s, equivalent to 15000.0/2.8 new/old ops (0.001965s for 2 clones -- as 25406.9/4.7 ops, or 12703.5/2.4 ops per clone), SPEEDUP of 5403.822x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5403.822x (0.0004179s -> 7.734e-08s), will amortize in 2.8 ops by saving 0.0004179s per op. +In 1 tuning rounds (tot. 0.0042s, 0.002s for constructor, 2 clones) obtained a SPEEDUP of 540282.2% (5404x) (from 0.2297 to 1241 Mflops). #pr: updating sample at index 5 (4^th of 16), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.00690508 s (5.479e-04 s -> 7.645e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00425196 s (4.179e-04 s -> 7.734e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0283039 s and estimated a speedup of 1.000000 x (7.645e-08 s -> 7.645e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0203819 s and estimated a speedup of 1.000000 x (7.734e-08 s -> 7.734e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.002283 0.001792 0.004075 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004075 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002283 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001792 -%:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004075 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000001 0.000949 0.000836 0.001785 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001786 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.000949 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000836 +%:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000001 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 1.000 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001785 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:RSB_SUBDIVISION_SCALING:A.mtx S N 12 3 3 6 1.00 %:RSB_SHUFFLE_SCALING:A.mtx S N 12 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 12 3 3 6 nan 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:A.mtx S N 12 3 3 6 1.00 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 12 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 12 3 3 6 28 48 36 @@ -4600,50 +4636,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00587916 1e+09 1e+09 +%operation:A.mtx 0.00260282 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.0022831 0 0.00179195 +%constructor:A.mtx 9.53674e-07 0.000948906 0 0.000835896 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.003s): (3 x 3)[0xaaaaf1f3b400]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.002s): (3 x 3)[0xaaaaeb9d9440]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.00164s; avg 0.0005466s ( +/- 22.27/ 12.14 %); best 0.0004249s; worst 0.000613s; std dev. 8.621e-05 (taking best). -Reference operation time is 0.000424862 s (0.9038 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004249 Mflops: 0.904) -Merge (3 -> 1 leaves) took w.c.t. of 5.96e-06s, ~3.099e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 92.60/107.69 %); best 7.645e-08s; worst 2.146e-06s; std dev. 8.778e-07 (taking best). -Reference operation time is 7.64489e-08 s (5023 Mflops) with 12 threads. -After merge step 1: tpop: 7.645e-08 s ~Mflops: 5022.962 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5557.461x: 0.0004249s -> 7.645e-08s, so taking this instance. +3 iterations (12 th.) took 0.001231s; avg 0.0004103s ( +/- 3.02/ 2.38 %); best 0.0003979s; worst 0.0004201s; std dev. 9.24e-06 (taking best). +Reference operation time is 0.000397921 s (0.965 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0003979 Mflops: 0.965) +Merge (3 -> 1 leaves) took w.c.t. of 5.96e-06s, ~3.099e-06s of computing time (of which 0s sorting, 0s analysis) +3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 91.89/200.00 %); best 7.734e-08s; worst 2.861e-06s; std dev. 1.349e-06 (taking best). +Reference operation time is 7.7343e-08 s (4965 Mflops) with 12 threads. +After merge step 1: tpop: 7.734e-08 s ~Mflops: 4964.897 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5144.883x: 0.0003979s -> 7.734e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001487s (of which 6.914e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001487s, equivalent to 19451.1/3.5 new/old ops (0.002936s for 2 clones -- as 38403.2/6.9 ops, or 19201.6/3.5 ops per clone), SPEEDUP of 5557.461x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5557.461x (0.0004249s -> 7.645e-08s), will amortize in 3.5 ops by saving 0.0004248s per op. -In 1 tuning rounds (tot. 0.0046s, 0.0029s for constructor, 2 clones) obtained a SPEEDUP of 555646.1% (5557x) (from 0.9038 to 5023 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001222s (of which 8.106e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 0.001222s, equivalent to 15798.4/3.1 new/old ops (0.002426s for 2 clones -- as 31365.6/6.1 ops, or 15682.8/3.0 ops per clone), SPEEDUP of 5144.883x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5144.883x (0.0003979s -> 7.734e-08s), will amortize in 3.1 ops by saving 0.0003978s per op. +In 1 tuning rounds (tot. 0.0037s, 0.0024s for constructor, 2 clones) obtained a SPEEDUP of 514388.3% (5145x) (from 0.965 to 4965 Mflops). #pr: updating sample at index 13 (5^th of 16), 0^th touch for (0,0,0,0,1,2,0). -First run of RSB Autotuner took 0.00461698 s (4.249e-04 s -> 7.645e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00369787 s (3.979e-04 s -> 7.734e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.021759 s and estimated a speedup of 1.000000 x (7.645e-08 s -> 7.645e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0212882 s and estimated a speedup of 1.000000 x (7.734e-08 s -> 7.734e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001203 0.001116 0.002319 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002319 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001203 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001116 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.000818 0.000816 0.001634 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001634 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.000818 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000816 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002319 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001634 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4658,59 +4694,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00320101 1e+09 1e+09 +%operation:A.mtx 0.00245404 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00120306 0 0.00111604 +%constructor:A.mtx 0 0.000818014 0 0.000815868 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.679s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.245s/0.000s . +# so far, program took 5.690s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.239s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.08278s (system CPU time used) -ru_utime : 7.571s (user CPU time used) +ru_stime : 0.06458s (system CPU time used) +ru_utime : 8.049s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was C). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.679s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.245s/0.000s . +# so far, program took 5.690s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.239s/0.000s . # Reusing type converted (C->Z) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.003s): (3 x 3)[0xaaaaf1f3b400]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.002s): (3 x 3)[0xaaaaeb9d9440]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.001278s; avg 0.000426s ( +/- 2.11/ 1.42 %); best 0.000417s; worst 0.000432s; std dev. 6.475e-06 (taking best). -Reference operation time is 0.000416994 s (0.2302 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000417 Mflops: 0.230) -Merge (3 -> 1 leaves) took w.c.t. of 5.007e-06s, ~2.146e-06s of computing time (of which 1.192e-06s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 1.502e-05s; avg 5.007e-06s ( +/- 98.47/200.00 %); best 7.645e-08s; worst 1.502e-05s; std dev. 7.081e-06 (taking best). -Reference operation time is 7.64489e-08 s (1256 Mflops) with 12 threads. -After merge step 1: tpop: 7.645e-08 s ~Mflops: 1255.740 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5454.545x: 0.000417s -> 7.645e-08s, so taking this instance. +3 iterations (12 th.) took 0.001299s; avg 0.000433s ( +/- 0.94/ 1.16 %); best 0.0004289s; worst 0.000438s; std dev. 3.76e-06 (taking best). +Reference operation time is 0.000428915 s (0.2238 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004289 Mflops: 0.224) +Merge (3 -> 1 leaves) took w.c.t. of 7.153e-06s, ~2.861e-06s of computing time (of which 0s sorting, 0s analysis) +3 iterations (12 th.) took 1.597e-05s; avg 5.325e-06s ( +/- 98.55/182.09 %); best 7.734e-08s; worst 1.502e-05s; std dev. 6.867e-06 (taking best). +Reference operation time is 7.7343e-08 s (1241 Mflops) with 12 threads. +After merge step 1: tpop: 7.734e-08 s ~Mflops: 1241.224 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5545.623x: 0.0004289s -> 7.734e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001266s (of which 6.914e-06s partitioning, 0s I/O); computing times: 2.146e-06s in par. loops, 1.192e-06s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001266s, equivalent to 16560.1/3.0 new/old ops (0.002489s for 2 clones -- as 32555.7/6.0 ops, or 16277.9/3.0 ops per clone), SPEEDUP of 5454.545x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5454.545x (0.000417s -> 7.645e-08s), will amortize in 3.0 ops by saving 0.0004169s per op. -In 1 tuning rounds (tot. 0.0038s, 0.0025s for constructor, 2 clones) obtained a SPEEDUP of 545354.5% (5455x) (from 0.2302 to 1256 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001287s (of which 8.106e-06s partitioning, 0s I/O); computing times: 2.861e-06s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 0.001287s, equivalent to 16640.0/3.0 new/old ops (0.002532s for 2 clones -- as 32740.4/5.9 ops, or 16370.2/3.0 ops per clone), SPEEDUP of 5545.623x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5545.623x (0.0004289s -> 7.734e-08s), will amortize in 3.0 ops by saving 0.0004288s per op. +In 1 tuning rounds (tot. 0.0039s, 0.0025s for constructor, 2 clones) obtained a SPEEDUP of 554462.3% (5546x) (from 0.2238 to 1241 Mflops). #pr: updating sample at index 7 (6^th of 16), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.0038178 s (4.170e-04 s -> 7.645e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00388384 s (4.289e-04 s -> 7.734e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0213912 s and estimated a speedup of 1.000000 x (7.645e-08 s -> 7.645e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.026685 s and estimated a speedup of 1.000000 x (7.734e-08 s -> 7.734e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.000844 0.000857 0.001701 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001701 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.000844 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000857 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.000692 0.000879 0.001571 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001571 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.000692 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000879 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001701 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001571 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4725,50 +4761,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00253797 1e+09 1e+09 +%operation:A.mtx 0.00244713 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.000844002 0 0.000856876 +%constructor:A.mtx 0 0.000692129 0 0.000879049 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.003s): (3 x 3)[0xaaaaf1f3b400]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.003s): (3 x 3)[0xaaaaeb9d9440]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.001468s; avg 0.0004893s ( +/- 14.34/ 26.10 %); best 0.0004191s; worst 0.000617s; std dev. 9.045e-05 (taking best). -Reference operation time is 0.00041914 s (0.9162 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004191 Mflops: 0.916) -Merge (3 -> 1 leaves) took w.c.t. of 5.96e-06s, ~3.099e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 91.98/100.00 %); best 7.645e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 7.64489e-08 s (5023 Mflops) with 12 threads. -After merge step 1: tpop: 7.645e-08 s ~Mflops: 5022.962 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5482.613x: 0.0004191s -> 7.645e-08s, so taking this instance. +3 iterations (12 th.) took 0.005158s; avg 0.001719s ( +/- 75.75/132.13 %); best 0.000417s; worst 0.003991s; std dev. 0.001612 (taking best). +Reference operation time is 0.000416994 s (0.9209 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000417 Mflops: 0.921) +Merge (3 -> 1 leaves) took w.c.t. of 6.914e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 0s analysis) +3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 91.89/100.00 %); best 7.734e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). +Reference operation time is 7.7343e-08 s (4965 Mflops) with 12 threads. +After merge step 1: tpop: 7.734e-08 s ~Mflops: 4964.897 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5391.492x: 0.000417s -> 7.734e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001268s (of which 8.106e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001268s, equivalent to 16585.1/3.0 new/old ops (0.002512s for 2 clones -- as 32858.3/6.0 ops, or 16429.1/3.0 ops per clone), SPEEDUP of 5482.613x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5482.613x (0.0004191s -> 7.645e-08s), will amortize in 3.0 ops by saving 0.0004191s per op. -In 1 tuning rounds (tot. 0.004s, 0.0025s for constructor, 2 clones) obtained a SPEEDUP of 548161.3% (5483x) (from 0.9162 to 5023 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001298s (of which 8.106e-06s partitioning, 0s I/O); computing times: 1.907e-06s in par. loops, 9.537e-07s sorting, 0s analyzing) +Total merge + benchmarking process took 0.001298s, equivalent to 16781.8/3.1 new/old ops (0.002566s for 2 clones -- as 33178.2/6.2 ops, or 16589.1/3.1 ops per clone), SPEEDUP of 5391.492x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5391.492x (0.000417s -> 7.734e-08s), will amortize in 3.1 ops by saving 0.0004169s per op. +In 1 tuning rounds (tot. 0.0078s, 0.0026s for constructor, 2 clones) obtained a SPEEDUP of 539049.2% (5391x) (from 0.9209 to 4965 Mflops). #pr: updating sample at index 15 (7^th of 16), 0^th touch for (0,0,0,0,1,3,0). -First run of RSB Autotuner took 0.00418305 s (4.191e-04 s -> 7.645e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00792408 s (4.170e-04 s -> 7.734e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.027235 s and estimated a speedup of 1.000000 x (7.645e-08 s -> 7.645e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0249522 s and estimated a speedup of 1.000000 x (7.734e-08 s -> 7.734e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001017 0.000867 0.001884 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001884 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001017 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000867 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001040 0.000883 0.001923 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001923 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001040 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000883 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001884 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001923 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4783,37 +4819,37 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00275183 1e+09 1e+09 +%operation:A.mtx 0.00278497 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00101709 0 0.00086689 +%constructor:A.mtx 0 0.00103998 0 0.000883102 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.746s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.302s/0.000s . +# so far, program took 5.764s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.303s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.08752s (system CPU time used) -ru_utime : 8.157s (user CPU time used) +ru_stime : 0.07688s (system CPU time used) +ru_utime : 8.71s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to type D: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 313.94 1.194e-03 0.000e+00 7.645e-08 0.000e+00 1.156e-02 1.94e+00 5.17e+00 1 2.40e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1255.74 1.332e-03 0.000e+00 7.645e-08 0.000e+00 1.152e-02 4.76e+00 2.79e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 310.31 1.243e-03 0.000e+00 7.734e-08 0.000e+00 1.091e-02 1.91e+00 5.17e+00 1 2.40e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1241.22 9.499e-04 0.000e+00 7.734e-08 0.000e+00 8.681e-03 4.71e+00 2.79e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 1652012.9 % faster, avg. sp. ratio 16521.129x, max sp. ratio 17423.983x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 150969.9/150700.1/151239.7/301939.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.2/ 8.6/ 9.7/ 18.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.2, min. 8.6, max. 9.7 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1417440.1 % faster, avg. sp. ratio 14175.401x, max sp. ratio 16069.667x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 126638.4/112241.1/141035.8/253276.8 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.0/ 8.8/ 9.1/ 17.9 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.0, min. 8.8, max. 9.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.564/ 1.622/ 3.506,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.697/ 1.936/ 4.761,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.534/ 1.603/ 3.465,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.620/ 1.914/ 4.706,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 3.979/ 2.792/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) @@ -4821,210 +4857,210 @@ #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) #pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) #pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.848e+02, min 3.139e+02, max 1.256e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 4.609e-02, min 2.010e-02, max 7.207e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 1.529e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.263e-03s, min 1.194e-03s, max 1.332e-03s, tot 2.526e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.346e+01 2.909e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: best tun. rsb canon. mflops were: on avg. 7.758e+02, min 3.103e+02, max 1.241e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 6.019e-02, min 1.931e-02, max 1.011e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 1.547e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.096e-03s, min 9.499e-04s, max 1.243e-03s, tot 2.193e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.376e+01 2.975e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type S: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 313.94 5.319e-04 0.000e+00 7.645e-08 0.000e+00 6.313e-03 1.15e+00 3.17e+00 1 2.40e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.139e-04 0.000e+00 7.645e-08 0.000e+00 3.920e-03 2.56e+00 1.54e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 310.31 3.521e-04 0.000e+00 7.734e-08 0.000e+00 5.505e-03 1.14e+00 3.17e+00 1 2.40e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1241.22 5.960e-04 0.000e+00 7.734e-08 0.000e+00 5.462e-03 2.53e+00 1.54e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 618487.2 % faster, avg. sp. ratio 6185.872x, max sp. ratio 6957.742x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 66926.6/51277.1/82576.0/133853.1 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.7/ 9.5/ 11.9/ 21.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.7, min. 9.5, max. 11.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 612877.8 % faster, avg. sp. ratio 6129.778x, max sp. ratio 7706.535x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 70898.6/70619.6/71177.6/141797.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 12.4/ 9.2/ 15.6/ 24.8 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 12.4, min. 9.2, max. 15.6 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 8/ 8/ 8) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 24/ 24/ 24) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.465/ 0.994/ 1.936,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.715/ 1.151/ 2.564,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.448/ 0.983/ 1.914,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.672/ 1.138/ 2.534,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.354/ 1.542/ 3.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.848e+02, min 3.139e+02, max 1.256e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.385e-01, min 4.512e-02, max 2.319e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 1.529e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 4.729e-04s, min 4.139e-04s, max 5.319e-04s, tot 9.458e-04s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.438e+01 4.747e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 7.758e+02, min 3.103e+02, max 1.241e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.146e-01, min 6.815e-02, max 1.611e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 1.547e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 4.741e-04s, min 3.521e-04s, max 5.960e-04s, tot 9.482e-04s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.492e+01 4.854e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type C: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1255.74 5.479e-04 0.000e+00 7.645e-08 0.000e+00 6.905e-03 1.94e+00 1.29e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.249e-04 0.000e+00 7.645e-08 0.000e+00 4.617e-03 4.76e+00 6.98e-01 1 3.84e-04 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.179e-04 0.000e+00 7.734e-08 0.000e+00 4.252e-03 1.91e+00 1.29e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4964.90 3.979e-04 0.000e+00 7.734e-08 0.000e+00 3.698e-03 4.71e+00 6.98e-01 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 636107.7 % faster, avg. sp. ratio 6362.077x, max sp. ratio 7166.693x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 75357.9/60393.0/90322.8/150715.7 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.7/ 10.9/ 12.6/ 23.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 11.7, min. 10.9, max. 12.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 527335.3 % faster, avg. sp. ratio 5274.353x, max sp. ratio 5403.822x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 51393.3/47811.3/54975.3/102786.7 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.7/ 9.3/ 10.2/ 19.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.7, min. 9.3, max. 10.2 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.564/ 1.622/ 3.506,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.697/ 1.936/ 4.761,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.534/ 1.603/ 3.465,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.620/ 1.914/ 4.706,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 0.995/ 0.698/ 1.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.139e+03, min 1.256e+03, max 5.023e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.395e-01, min 1.752e-01, max 9.038e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 1.529e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 4.864e-04s, min 4.249e-04s, max 5.479e-04s, tot 9.727e-04s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.346e+01 2.909e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.01 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.01 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.103e+03, min 1.241e+03, max 4.965e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 5.974e-01, min 2.297e-01, max 9.650e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 1.547e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 4.079e-04s, min 3.979e-04s, max 4.179e-04s, tot 8.159e-04s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.376e+01 2.975e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type Z: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.170e-04 0.000e+00 7.645e-08 0.000e+00 3.818e-03 3.51e+00 2.29e+00 1 9.60e-05 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.191e-04 0.000e+00 7.645e-08 0.000e+00 4.183e-03 9.16e+00 1.32e+00 1 3.84e-04 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.289e-04 0.000e+00 7.734e-08 0.000e+00 3.884e-03 3.47e+00 2.29e+00 1 9.60e-05 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4964.90 4.170e-04 0.000e+00 7.734e-08 0.000e+00 7.924e-03 9.05e+00 1.32e+00 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 546757.9 % faster, avg. sp. ratio 5468.579x, max sp. ratio 5482.613x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 52328.1/49939.2/54717.0/104656.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.6/ 9.2/ 10.0/ 19.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.6, min. 9.2, max. 10.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 546755.7 % faster, avg. sp. ratio 5468.557x, max sp. ratio 5545.623x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 76334.8/50215.8/102453.8/152669.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.0/ 9.1/ 19.0/ 28.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.0, min. 9.1, max. 19.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.761/ 2.878/ 6.645,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.662/ 3.506/ 9.156,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.706/ 2.844/ 6.568,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.516/ 3.465/ 9.051,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.807/ 1.323/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.139e+03, min 1.256e+03, max 5.023e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.732e-01, min 2.302e-01, max 9.162e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 1.529e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 4.181e-04s, min 4.170e-04s, max 4.191e-04s, tot 8.361e-04s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.102e+00 1.640e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.01 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.01 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.103e+03, min 1.241e+03, max 4.965e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 5.723e-01, min 2.238e-01, max 9.209e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 1.547e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 4.230e-04s, min 4.170e-04s, max 4.289e-04s, tot 8.459e-04s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.261e+00 1.677e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 313.94 1.194e-03 0.000e+00 7.645e-08 0.000e+00 1.156e-02 1.94e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 313.94 5.319e-04 0.000e+00 7.645e-08 0.000e+00 6.313e-03 1.15e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1255.74 5.479e-04 0.000e+00 7.645e-08 0.000e+00 6.905e-03 1.94e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.170e-04 0.000e+00 7.645e-08 0.000e+00 3.818e-03 3.51e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 310.31 1.243e-03 0.000e+00 7.734e-08 0.000e+00 1.091e-02 1.91e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 310.31 3.521e-04 0.000e+00 7.734e-08 0.000e+00 5.505e-03 1.14e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.179e-04 0.000e+00 7.734e-08 0.000e+00 4.252e-03 1.91e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.289e-04 0.000e+00 7.734e-08 0.000e+00 3.884e-03 3.47e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 879831.4 % faster, avg. sp. ratio 8799.314x, max sp. ratio 15618.275x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 93519.4/49939.2/151239.7/374077.7 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.8/ 9.2/ 12.6/ 43.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.8, min. 9.2, max. 12.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 789203.3 % faster, avg. sp. ratio 7893.033x, max sp. ratio 16069.667x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 79351.1/50215.8/141035.8/317404.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.9/ 8.8/ 15.6/ 43.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 10.9, min. 8.8, max. 15.6 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.779/ 0.994/ 2.878,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 8.529/ 1.151/ 3.506,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.758/ 0.983/ 2.844,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 8.430/ 1.138/ 3.465,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.03 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.03 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.848e+02, min 3.139e+02, max 1.256e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.177e-01, min 2.010e-02, max 2.302e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 3.058e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.727e-04s, min 4.170e-04s, max 1.194e-03s, tot 2.691e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.640e+01 4.747e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 7.758e+02, min 3.103e+02, max 1.241e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.352e-01, min 1.931e-02, max 2.297e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 3.094e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.105e-04s, min 3.521e-04s, max 1.243e-03s, tot 2.442e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.677e+01 4.854e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: ======== Limiting to nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1255.74 1.332e-03 0.000e+00 7.645e-08 0.000e+00 1.152e-02 4.76e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.139e-04 0.000e+00 7.645e-08 0.000e+00 3.920e-03 2.56e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.249e-04 0.000e+00 7.645e-08 0.000e+00 4.617e-03 4.76e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.191e-04 0.000e+00 7.645e-08 0.000e+00 4.183e-03 9.16e+00 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1241.22 9.499e-04 0.000e+00 7.734e-08 0.000e+00 8.681e-03 4.71e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1241.22 5.960e-04 0.000e+00 7.734e-08 0.000e+00 5.462e-03 2.53e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4964.90 3.979e-04 0.000e+00 7.734e-08 0.000e+00 3.698e-03 4.71e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4964.90 4.170e-04 0.000e+00 7.734e-08 0.000e+00 7.924e-03 9.05e+00 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 846851.5 % faster, avg. sp. ratio 8469.515x, max sp. ratio 17423.983x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 79271.8/51277.1/150700.1/317087.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.7/ 8.6/ 10.9/ 39.0 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.7, min. 8.6, max. 10.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 763001.1 % faster, avg. sp. ratio 7631.011x, max sp. ratio 12281.134x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 83281.4/47811.3/112241.1/333125.8 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.6/ 9.1/ 19.0/ 46.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 11.7, min. 9.1, max. 19.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.898/ 1.936/ 6.645,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 21.243/ 2.564/ 9.156,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.853/ 1.914/ 6.568,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 20.997/ 2.534/ 9.051,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.139e+03, min 1.256e+03, max 5.023e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.310e-01, min 7.207e-02, max 9.162e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 3.058e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.475e-04s, min 4.139e-04s, max 1.332e-03s, tot 2.590e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.102e+00 2.438e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.03 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.03 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.103e+03, min 1.241e+03, max 4.965e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 5.370e-01, min 1.011e-01, max 9.650e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 3.094e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 5.902e-04s, min 3.979e-04s, max 9.499e-04s, tot 2.361e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.261e+00 2.492e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 313.94 1.194e-03 0.000e+00 7.645e-08 0.000e+00 1.156e-02 1.94e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 313.94 5.319e-04 0.000e+00 7.645e-08 0.000e+00 6.313e-03 1.15e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1255.74 5.479e-04 0.000e+00 7.645e-08 0.000e+00 6.905e-03 1.94e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.170e-04 0.000e+00 7.645e-08 0.000e+00 3.818e-03 3.51e+00 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1255.74 1.332e-03 0.000e+00 7.645e-08 0.000e+00 1.152e-02 4.76e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.139e-04 0.000e+00 7.645e-08 0.000e+00 3.920e-03 2.56e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.249e-04 0.000e+00 7.645e-08 0.000e+00 4.617e-03 4.76e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.191e-04 0.000e+00 7.645e-08 0.000e+00 4.183e-03 9.16e+00 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 310.31 1.243e-03 0.000e+00 7.734e-08 0.000e+00 1.091e-02 1.91e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 310.31 3.521e-04 0.000e+00 7.734e-08 0.000e+00 5.505e-03 1.14e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.179e-04 0.000e+00 7.734e-08 0.000e+00 4.252e-03 1.91e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.289e-04 0.000e+00 7.734e-08 0.000e+00 3.884e-03 3.47e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1241.22 9.499e-04 0.000e+00 7.734e-08 0.000e+00 8.681e-03 4.71e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1241.22 5.960e-04 0.000e+00 7.734e-08 0.000e+00 5.462e-03 2.53e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4964.90 3.979e-04 0.000e+00 7.734e-08 0.000e+00 3.698e-03 4.71e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4964.90 4.170e-04 0.000e+00 7.734e-08 0.000e+00 7.924e-03 9.05e+00 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 863341.4 % faster, avg. sp. ratio 8634.414x, max sp. ratio 17423.983x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 86395.6/49939.2/151239.7/691164.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.3/ 8.6/ 12.6/ 82.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.3, min. 8.6, max. 12.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 776102.2 % faster, avg. sp. ratio 7762.022x, max sp. ratio 16069.667x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 81316.3/47811.3/141035.8/650530.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.3/ 8.8/ 19.0/ 90.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 11.3, min. 8.8, max. 19.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.838/ 0.994/ 6.645,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.772/ 1.151/ 9.156,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.806/ 0.983/ 6.568,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.427/ 1.138/ 9.051,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) @@ -5032,83 +5068,83 @@ #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) #pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.05 s (8 samples) #pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.05 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.962e+03, min 3.139e+02, max 5.023e+03 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.243e-01, min 2.010e-02, max 9.162e-01 (8 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 6.116e-07s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.601e-04s, min 4.139e-04s, max 1.332e-03s, tot 5.281e-03s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.102e+00 4.747e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: best tun. rsb canon. mflops were: on avg. 1.939e+03, min 3.103e+02, max 4.965e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.361e-01, min 1.931e-02, max 9.650e-01 (8 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 6.187e-07s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.003e-04s, min 3.521e-04s, max 1.243e-03s, tot 4.803e-03s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.261e+00 4.854e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 313.94 1.194e-03 0.000e+00 7.645e-08 0.000e+00 1.156e-02 1.94e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 313.94 5.319e-04 0.000e+00 7.645e-08 0.000e+00 6.313e-03 1.15e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1255.74 5.479e-04 0.000e+00 7.645e-08 0.000e+00 6.905e-03 1.94e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.170e-04 0.000e+00 7.645e-08 0.000e+00 3.818e-03 3.51e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 310.31 1.243e-03 0.000e+00 7.734e-08 0.000e+00 1.091e-02 1.91e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 310.31 3.521e-04 0.000e+00 7.734e-08 0.000e+00 5.505e-03 1.14e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.179e-04 0.000e+00 7.734e-08 0.000e+00 4.252e-03 1.91e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.289e-04 0.000e+00 7.734e-08 0.000e+00 3.884e-03 3.47e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 879831.4 % faster, avg. sp. ratio 8799.314x, max sp. ratio 15618.275x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 93519.4/49939.2/151239.7/374077.7 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.8/ 9.2/ 12.6/ 43.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.8, min. 9.2, max. 12.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 789203.3 % faster, avg. sp. ratio 7893.033x, max sp. ratio 16069.667x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 79351.1/50215.8/141035.8/317404.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.9/ 8.8/ 15.6/ 43.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 10.9, min. 8.8, max. 15.6 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.779/ 0.994/ 2.878,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 8.529/ 1.151/ 3.506,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.758/ 0.983/ 2.844,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 8.430/ 1.138/ 3.465,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.03 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.03 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.848e+02, min 3.139e+02, max 1.256e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.177e-01, min 2.010e-02, max 2.302e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 3.058e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.727e-04s, min 4.170e-04s, max 1.194e-03s, tot 2.691e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.640e+01 4.747e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 7.758e+02, min 3.103e+02, max 1.241e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.352e-01, min 1.931e-02, max 2.297e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 3.094e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.105e-04s, min 3.521e-04s, max 1.243e-03s, tot 2.442e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.677e+01 4.854e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: ======== Limiting to both transA=N and nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1255.74 1.332e-03 0.000e+00 7.645e-08 0.000e+00 1.152e-02 4.76e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.139e-04 0.000e+00 7.645e-08 0.000e+00 3.920e-03 2.56e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.249e-04 0.000e+00 7.645e-08 0.000e+00 4.617e-03 4.76e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.191e-04 0.000e+00 7.645e-08 0.000e+00 4.183e-03 9.16e+00 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1241.22 9.499e-04 0.000e+00 7.734e-08 0.000e+00 8.681e-03 4.71e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1241.22 5.960e-04 0.000e+00 7.734e-08 0.000e+00 5.462e-03 2.53e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4964.90 3.979e-04 0.000e+00 7.734e-08 0.000e+00 3.698e-03 4.71e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4964.90 4.170e-04 0.000e+00 7.734e-08 0.000e+00 7.924e-03 9.05e+00 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 846851.5 % faster, avg. sp. ratio 8469.515x, max sp. ratio 17423.983x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 79271.8/51277.1/150700.1/317087.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.7/ 8.6/ 10.9/ 39.0 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.7, min. 8.6, max. 10.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 763001.1 % faster, avg. sp. ratio 7631.011x, max sp. ratio 12281.134x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 83281.4/47811.3/112241.1/333125.8 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.6/ 9.1/ 19.0/ 46.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 11.7, min. 9.1, max. 19.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.898/ 1.936/ 6.645,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 21.243/ 2.564/ 9.156,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.853/ 1.914/ 6.568,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 20.997/ 2.534/ 9.051,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.139e+03, min 1.256e+03, max 5.023e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.310e-01, min 7.207e-02, max 9.162e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 3.058e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.475e-04s, min 4.139e-04s, max 1.332e-03s, tot 2.590e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.102e+00 2.438e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.03 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.03 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.103e+03, min 1.241e+03, max 4.965e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 5.370e-01, min 1.011e-01, max 9.650e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 3.094e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 5.902e-04s, min 3.979e-04s, max 9.499e-04s, tot 2.361e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.261e+00 2.492e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 8) matched the dump criteria -- skipping dump round. @@ -5119,27 +5155,27 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 313.94 1.194e-03 0.000e+00 7.645e-08 0.000e+00 1.156e-02 1.94e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 313.94 5.319e-04 0.000e+00 7.645e-08 0.000e+00 6.313e-03 1.15e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1255.74 5.479e-04 0.000e+00 7.645e-08 0.000e+00 6.905e-03 1.94e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.170e-04 0.000e+00 7.645e-08 0.000e+00 3.818e-03 3.51e+00 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1255.74 1.332e-03 0.000e+00 7.645e-08 0.000e+00 1.152e-02 4.76e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1255.74 4.139e-04 0.000e+00 7.645e-08 0.000e+00 3.920e-03 2.56e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.249e-04 0.000e+00 7.645e-08 0.000e+00 4.617e-03 4.76e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 5022.96 4.191e-04 0.000e+00 7.645e-08 0.000e+00 4.183e-03 9.16e+00 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 310.31 1.243e-03 0.000e+00 7.734e-08 0.000e+00 1.091e-02 1.91e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 310.31 3.521e-04 0.000e+00 7.734e-08 0.000e+00 5.505e-03 1.14e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.179e-04 0.000e+00 7.734e-08 0.000e+00 4.252e-03 1.91e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1241.22 4.289e-04 0.000e+00 7.734e-08 0.000e+00 3.884e-03 3.47e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1241.22 9.499e-04 0.000e+00 7.734e-08 0.000e+00 8.681e-03 4.71e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1241.22 5.960e-04 0.000e+00 7.734e-08 0.000e+00 5.462e-03 2.53e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4964.90 3.979e-04 0.000e+00 7.734e-08 0.000e+00 3.698e-03 4.71e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4964.90 4.170e-04 0.000e+00 7.734e-08 0.000e+00 7.924e-03 9.05e+00 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 863341.4 % faster, avg. sp. ratio 8634.414x, max sp. ratio 17423.983x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 86395.6/49939.2/151239.7/691164.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.3/ 8.6/ 12.6/ 82.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.3, min. 8.6, max. 12.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 776102.2 % faster, avg. sp. ratio 7762.022x, max sp. ratio 16069.667x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 81316.3/47811.3/141035.8/650530.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.3/ 8.8/ 19.0/ 90.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 11.3, min. 8.8, max. 19.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.838/ 0.994/ 6.645,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.772/ 1.151/ 9.156,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.806/ 0.983/ 6.568,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.427/ 1.138/ 9.051,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) @@ -5147,21 +5183,21 @@ #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) #pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.05 s (8 samples) #pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.05 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.962e+03, min 3.139e+02, max 5.023e+03 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.243e-01, min 2.010e-02, max 9.162e-01 (8 samples) -#pr: best tun. rsb operation time was: on avg. 7.645e-08s, min 7.645e-08s, max 7.645e-08s, tot 6.116e-07s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.601e-04s, min 4.139e-04s, max 1.332e-03s, tot 5.281e-03s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.102e+00 4.747e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.010e+00 +#pr: best tun. rsb canon. mflops were: on avg. 1.939e+03, min 3.103e+02, max 4.965e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.361e-01, min 1.931e-02, max 9.650e-01 (8 samples) +#pr: best tun. rsb operation time was: on avg. 7.734e-08s, min 7.734e-08s, max 7.734e-08s, tot 6.187e-07s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.003e-04s, min 3.521e-04s, max 1.243e-03s, tot 4.803e-03s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.261e+00 4.854e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.995e-01 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: Record collection took 0.34 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 105 environment variables in 5773 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 105 environment variables in 5827 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1796064025_gcc-15.2.rpr -# Removing the temporary record file rsbench_pr__1796064025_gcc-15.2.rpr.tmp. -# terminating run at 1796064031 (after 5.7s of w.c.t.) -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash ./scripts/doc-tests.sh +#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1761654541_gcc-15.2.rpr +# Removing the temporary record file rsbench_pr__1761654541_gcc-15.2.rpr.tmp. +# terminating run at 1761654547 (after 5.8s of w.c.t.) +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh ./scripts/doc-tests.sh + set -o pipefail + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x + cat /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/autotune.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/io-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/power.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/snippets.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/transpose.c @@ -5215,7 +5251,7 @@ type char codes:D S C Z gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' if test /build/reproducible-path/librsb-1.3.0.2+dfsg != /build/reproducible-path/librsb-1.3.0.2+dfsg ; then cp /build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/vf.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/examples ; fi -( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) +( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) + which rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench + BRF=test.rpr @@ -5225,15 +5261,15 @@ Will invoke autotuning for ~10.000000 s x 1 rounds, specifying verbosity=0 and threads=0. (>0 means no structure tuning; 0 means only structure tuning, <0 means tuning of both with (negated) thread count suggestion). # Requested no transposition. # performance record file set to: test.rpr -# beginning run at 1796064031 +# beginning run at 1761654547 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench --lower 100 --as-symmetric --types : -n 1 --notranspose --compare-competitors --verbose --verbose --write-performance-record=test.rpr # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -# average timer granularity: 2.99e-08 s +# average timer granularity: 2.93e-08 s # Will write a final performance record to file test.rpr and periodic checkpoints to test.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -5272,7 +5308,7 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 2 (each --verbose occurrence counts +1) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 43690 bytes @@ -5292,29 +5328,29 @@ # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 5.288s +# Memory benchmark took 5.339s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 4 samples (1120 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.289s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.341s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.428e-02 s (100.00 %) - analyzed arrays in 2.651e-03 s (18.57 %) - cleaned-up arrays in 1.121e-05 s (0.08 %) - deduplicated arrays in 1.001e-05 s (0.07 %) + converted COO to RSB in 9.549e-03 s (100.00 %) + analyzed arrays in 2.195e-03 s (22.99 %) + cleaned-up arrays in 1.001e-05 s (0.10 %) + deduplicated arrays in 1.001e-05 s (0.10 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.836e-03 s (33.87 %) - memory allocations took 9.060e-06 s (0.06 %) - leafs setup took 7.153e-06 s (0.05 %) - halfword conversion took 6.751e-03 s (47.28 %) -Built (100 x 100)[0xaaaac7294530]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.014s): (100 x 100)[0xaaaac7294530]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 4.911e-03 s (51.43 %) + memory allocations took 1.383e-05 s (0.14 %) + leafs setup took 6.914e-06 s (0.07 %) + halfword conversion took 2.400e-03 s (25.13 %) +Built (100 x 100)[0xaaaae44b9570]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.010s): (100 x 100)[0xaaaae44b9570]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -5365,10 +5401,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003669s; avg 0.001223s ( +/- 0.32/ 0.32 %); best 0.001219s; worst 0.001227s; std dev. 3.213e-06 (taking best). -Reference operation time is 0.00121903 s (16.57 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.001219 Mflops: 16.570) -Merge (3 -> 1 leaves) took w.c.t. of 4.292e-05s, ~3.29e-05s of computing time (of which 1.502e-05s sorting, 2.861e-06s analysis) +3 iterations (1 th.) took 0.003648s; avg 0.001216s ( +/- 2.54/ 2.70 %); best 0.001185s; worst 0.001249s; std dev. 2.603e-05 (taking best). +Reference operation time is 0.00118518 s (17.04 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.001185 Mflops: 17.044) +Merge (3 -> 1 leaves) took w.c.t. of 0.0002351s, ~0.0002179s of computing time (of which 0.0001721s sorting, 5.007e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5399,8 +5435,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 1.907e-05s; avg 6.358e-06s ( +/- 21.25/ 27.50 %); best 5.007e-06s; worst 8.106e-06s; std dev. 1.296e-06 (taking best). -Reference operation time is 5.00679e-06 s (4035 Mflops) with 1 threads. +3 iterations (1 th.) took 5.412e-05s; avg 1.804e-05s ( +/- 6.17/ 11.01 %); best 1.693e-05s; worst 2.003e-05s; std dev. 1.408e-06 (taking best). +Reference operation time is 1.69277e-05 s (1193 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5416,16 +5452,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 5.007e-06 s ~Mflops: 4034.521 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 243.476x: 0.001219s -> 5.007e-06s, so taking this instance. +After merge step 1: tpop: 1.693e-05 s ~Mflops: 1193.309 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 70.014x: 0.001185s -> 1.693e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01197s (of which 4.506e-05s partitioning, 0.008294s I/O); computing times: 3.29e-05s in par. loops, 1.502e-05s sorting, 2.861e-06s analyzing) -Total merge + benchmarking process took 0.01197s, equivalent to 2391.0/9.8 new/old ops (0.007893s for 2 clones -- as 1576.4/6.5 ops, or 788.2/3.2 ops per clone), SPEEDUP of 243.476x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 243.476x (0.001219s -> 5.007e-06s), will amortize in 9.9 ops by saving 0.001214s per op. -In 1 tuning rounds (tot. 0.02s, 0.0079s for constructor, 2 clones) obtained a SPEEDUP of 24247.6% (243.5x) (from 16.57 to 4035 Mflops). Employed 0.0084s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01504s (of which 0.0002429s partitioning, 0.01137s I/O); computing times: 0.0002179s in par. loops, 0.0001721s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.01504s, equivalent to 888.4/12.7 new/old ops (0.006968s for 2 clones -- as 411.6/5.9 ops, or 205.8/2.9 ops per clone), SPEEDUP of 70.014x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 70.014x (0.001185s -> 1.693e-05s), will amortize in 12.9 ops by saving 0.001168s per op. +In 1 tuning rounds (tot. 0.022s, 0.007s for constructor, 2 clones) obtained a SPEEDUP of 6901.4% (70.01x) (from 17.04 to 1193 Mflops). Employed 0.0086s for I/O of matrix plots. #pr: updating sample at index 1 (0^th of 4), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.0284681 s (1.219e-03 s -> 5.007e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.031112 s (1.185e-03 s -> 1.693e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -5491,20 +5527,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 2.098e-05s; avg 6.994e-06s ( +/- 28.41/ 39.77 %); best 5.007e-06s; worst 9.775e-06s; std dev. 2.026e-06 (taking best). -Reference operation time is 5.00679e-06 s (4035 Mflops) with 1 threads. +3 iterations (1 th.) took 5.579e-05s; avg 1.86e-05s ( +/- 8.97/ 17.95 %); best 1.693e-05s; worst 2.193e-05s; std dev. 2.36e-06 (taking best). +Reference operation time is 1.69277e-05 s (1193 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.199e-03 s (100.00 %) - analyzed arrays in 1.718e-03 s (40.92 %) - cleaned-up arrays in 8.821e-06 s (0.21 %) - deduplicated arrays in 8.106e-06 s (0.19 %) + converted COO to RSB in 4.026e-03 s (100.00 %) + analyzed arrays in 1.524e-03 s (37.85 %) + cleaned-up arrays in 2.503e-05 s (0.62 %) + deduplicated arrays in 2.599e-05 s (0.65 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.453e-03 s (58.41 %) - memory allocations took 4.292e-06 s (0.10 %) - leafs setup took 2.146e-06 s (0.05 %) - halfword conversion took 3.815e-06 s (0.09 %) -Built (100 x 100)[0xaaaac729ed20]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 2.439e-03 s (60.57 %) + memory allocations took 5.245e-06 s (0.13 %) + leafs setup took 1.192e-06 s (0.03 %) + halfword conversion took 5.007e-06 s (0.12 %) +Built (100 x 100)[0xaaaae44c3d60]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5538,16 +5574,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 7.719e-03 s (100.00 %) - analyzed arrays in 1.772e-03 s (22.96 %) - cleaned-up arrays in 9.060e-06 s (0.12 %) - deduplicated arrays in 9.060e-06 s (0.12 %) + converted COO to RSB in 7.544e-03 s (100.00 %) + analyzed arrays in 2.140e-03 s (28.37 %) + cleaned-up arrays in 2.480e-05 s (0.33 %) + deduplicated arrays in 2.408e-05 s (0.32 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.248e-03 s (42.08 %) - memory allocations took 3.815e-06 s (0.05 %) - leafs setup took 2.861e-06 s (0.04 %) - halfword conversion took 2.674e-03 s (34.64 %) -Built (100 x 100)[0xaaaac7294860]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + shuffled partitions in 2.891e-03 s (38.32 %) + memory allocations took 4.053e-06 s (0.05 %) + leafs setup took 1.907e-06 s (0.03 %) + halfword conversion took 2.458e-03 s (32.58 %) +Built (100 x 100)[0xaaaae44b98a0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5593,9 +5629,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.00354s; avg 0.00118s ( +/- 40.78/ 34.24 %); best 0.0006988s; worst 0.001584s; std dev. 0.0003655 (taking best). -Reference operation time is 0.000698805 s (28.91 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000698805 s/0 threads (speedup 0.00716479 x), same?n. +3 iterations (1 th.) took 0.004182s; avg 0.001394s ( +/- 12.12/ 24.17 %); best 0.001225s; worst 0.001731s; std dev. 0.0002383 (taking best). +Reference operation time is 0.00122499 s (16.49 Mflops) with 1 threads. +Challenging best inner round reference (1.69277e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.00122499 s/0 threads (speedup 0.0138186 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5629,16 +5665,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 7.734e-03 s (100.00 %) - analyzed arrays in 3.265e-03 s (42.22 %) - cleaned-up arrays in 2.503e-05 s (0.32 %) - deduplicated arrays in 2.694e-05 s (0.35 %) + converted COO to RSB in 8.272e-03 s (100.00 %) + analyzed arrays in 2.655e-03 s (32.10 %) + cleaned-up arrays in 2.289e-05 s (0.28 %) + deduplicated arrays in 2.098e-05 s (0.25 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.137e-03 s (27.63 %) + shuffled partitions in 2.698e-03 s (32.62 %) memory allocations took 5.007e-06 s (0.06 %) - leafs setup took 4.053e-06 s (0.05 %) - halfword conversion took 2.269e-03 s (29.34 %) -Built (100 x 100)[0xaaaac7295250]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + leafs setup took 2.861e-06 s (0.03 %) + halfword conversion took 2.867e-03 s (34.66 %) +Built (100 x 100)[0xaaaae44ba290]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5684,9 +5720,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003324s; avg 0.001108s ( +/- 3.23/ 2.79 %); best 0.001072s; worst 0.001139s; std dev. 2.748e-05 (taking best). -Reference operation time is 0.00107217 s (18.84 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.00107217 s/0 threads (speedup 0.00466978 x), same?n. +3 iterations (1 th.) took 0.003495s; avg 0.001165s ( +/- 1.89/ 3.02 %); best 0.001143s; worst 0.0012s; std dev. 2.515e-05 (taking best). +Reference operation time is 0.00114298 s (17.67 Mflops) with 1 threads. +Challenging best inner round reference (1.69277e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.00114298 s/0 threads (speedup 0.0148102 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5720,16 +5756,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.942e-03 s (100.00 %) - analyzed arrays in 2.921e-03 s (42.08 %) - cleaned-up arrays in 1.884e-05 s (0.27 %) - deduplicated arrays in 1.717e-05 s (0.25 %) + converted COO to RSB in 7.403e-03 s (100.00 %) + analyzed arrays in 3.069e-03 s (41.45 %) + cleaned-up arrays in 2.289e-05 s (0.31 %) + deduplicated arrays in 2.313e-05 s (0.31 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.320e-03 s (33.42 %) - memory allocations took 3.099e-06 s (0.04 %) - leafs setup took 2.146e-06 s (0.03 %) - halfword conversion took 1.659e-03 s (23.90 %) -Built (100 x 100)[0xaaaac729ee40]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' + shuffled partitions in 2.560e-03 s (34.58 %) + memory allocations took 6.199e-06 s (0.08 %) + leafs setup took 4.053e-06 s (0.05 %) + halfword conversion took 1.716e-03 s (23.18 %) +Built (100 x 100)[0xaaaae44c3e80]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 24, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5775,10 +5811,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003099s; avg 0.001033s ( +/- 5.90/ 7.46 %); best 0.000972s; worst 0.00111s; std dev. 5.75e-05 (taking best). -Reference operation time is 0.000972033 s (20.78 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.000972033 s/0 threads (speedup 0.00515085 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 34 subms, 25 lsubms, 2.3168 bpnz +3 iterations (1 th.) took 0.003481s; avg 0.00116s ( +/- 53.05/ 58.32 %); best 0.0005448s; worst 0.001837s; std dev. 0.0005293 (taking best). +Reference operation time is 0.000544786 s (37.08 Mflops) with 1 threads. +Challenging best inner round reference (1.69277e-05 s/1 threads) with: subdivision 1, 24 leaves, 2.306 bytes/nz, 0.000544786 s/0 threads (speedup 0.0310722 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 33 subms, 24 lsubms, 2.3057 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5811,16 +5847,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.289e-03 s (100.00 %) - analyzed arrays in 2.199e-03 s (34.96 %) - cleaned-up arrays in 1.693e-05 s (0.27 %) - deduplicated arrays in 1.693e-05 s (0.27 %) + converted COO to RSB in 7.986e-03 s (100.00 %) + analyzed arrays in 2.960e-03 s (37.07 %) + cleaned-up arrays in 2.003e-05 s (0.25 %) + deduplicated arrays in 1.717e-05 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.141e-03 s (34.04 %) - memory allocations took 5.245e-06 s (0.08 %) - leafs setup took 3.099e-06 s (0.05 %) - halfword conversion took 1.907e-03 s (30.32 %) -Built (100 x 100)[0xaaaac72c5ae0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 2.723e-03 s (34.10 %) + memory allocations took 4.768e-06 s (0.06 %) + leafs setup took 3.099e-06 s (0.04 %) + halfword conversion took 2.256e-03 s (28.25 %) +Built (100 x 100)[0xaaaae44eab20]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5866,9 +5902,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.00261s; avg 0.0008701s ( +/- 14.59/ 28.38 %); best 0.0007432s; worst 0.001117s; std dev. 0.0001746 (taking best). -Reference operation time is 0.000743151 s (27.18 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000743151 s/0 threads (speedup 0.00673725 x), same?n. +3 iterations (1 th.) took 0.003036s; avg 0.001012s ( +/- 19.36/ 13.34 %); best 0.0008161s; worst 0.001147s; std dev. 0.0001418 (taking best). +Reference operation time is 0.000816107 s (24.75 Mflops) with 1 threads. +Challenging best inner round reference (1.69277e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000816107 s/0 threads (speedup 0.020742 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5902,16 +5938,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.806e-03 s (100.00 %) - analyzed arrays in 1.938e-03 s (40.33 %) - cleaned-up arrays in 8.821e-06 s (0.18 %) - deduplicated arrays in 9.060e-06 s (0.19 %) + converted COO to RSB in 8.661e-03 s (100.00 %) + analyzed arrays in 3.413e-03 s (39.41 %) + cleaned-up arrays in 1.693e-05 s (0.20 %) + deduplicated arrays in 1.407e-05 s (0.16 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.430e-03 s (29.75 %) - memory allocations took 3.099e-06 s (0.06 %) - leafs setup took 1.907e-06 s (0.04 %) - halfword conversion took 1.415e-03 s (29.44 %) -Built (100 x 100)[0xaaaac72c5ae0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 2.747e-03 s (31.72 %) + memory allocations took 5.007e-06 s (0.06 %) + leafs setup took 2.861e-06 s (0.03 %) + halfword conversion took 2.462e-03 s (28.43 %) +Built (100 x 100)[0xaaaae44eab20]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5957,11 +5993,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.00225s; avg 0.00075s ( +/- 42.27/ 27.89 %); best 0.000433s; worst 0.0009592s; std dev. 0.0002279 (taking best). -Reference operation time is 0.000432968 s (46.65 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000432968 s/0 threads (speedup 0.0115639 x), same?n. +3 iterations (1 th.) took 0.003447s; avg 0.001149s ( +/- 13.31/ 24.10 %); best 0.0009961s; worst 0.001426s; std dev. 0.0001962 (taking best). +Reference operation time is 0.000996113 s (20.28 Mflops) with 1 threads. +Challenging best inner round reference (1.69277e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000996113 s/0 threads (speedup 0.0169938 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 4034.52 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 1193.31 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5977,23 +6013,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.054039 s (eq. to 1e+04/ 1e+04 old/new op.times), gained local/global speedup 1 x (5.00679e-06 : 5.00679e-06) / 1 x (5.00679e-06 : 5.00679e-06). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.062825 s (eq. to 4e+03/ 4e+03 old/new op.times), gained local/global speedup 1 x (1.69277e-05 : 1.69277e-05) / 1 x (1.69277e-05 : 1.69277e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.054s, 0.039s for constructor, 0 clones) obtained NO speedup (best stays 4035 Mflops). -Second run of RSB Autotuner took 0.054059 s and estimated a speedup of 1.000000 x (5.007e-06 s -> 5.007e-06 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.063s, 0.044s for constructor, 0 clones) obtained NO speedup (best stays 1193 Mflops). +Second run of RSB Autotuner took 0.0628588 s and estimated a speedup of 1.000000 x (1.693e-05 s -> 1.693e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:100 #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.002651 0.004836 0.007487 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.007487 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002651 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004836 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.002195 0.004911 0.007106 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.007106 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002195 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004911 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.007487 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.007106 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -6008,34 +6044,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.0142779 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.0095489 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00265098 0 0.00483584 -# so far, program took 5.394s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.083s/0.000s . +%constructor:lower-100x100-5050nz 0 0.00219512 0 0.00491118 +# so far, program took 5.451s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.094s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.05983s (system CPU time used) -ru_utime : 5.768s (user CPU time used) +ru_stime : 0.04788s (system CPU time used) +ru_utime : 6.026s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.394s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.083s/0.000s . +# so far, program took 5.451s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.094s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.215e-03 s (100.00 %) - analyzed arrays in 1.808e-03 s (19.62 %) - cleaned-up arrays in 1.407e-05 s (0.15 %) - deduplicated arrays in 1.192e-05 s (0.13 %) + converted COO to RSB in 7.635e-03 s (100.00 %) + analyzed arrays in 1.572e-03 s (20.59 %) + cleaned-up arrays in 1.621e-05 s (0.21 %) + deduplicated arrays in 1.383e-05 s (0.18 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 5.058e-03 s (54.89 %) - memory allocations took 3.815e-06 s (0.04 %) + shuffled partitions in 4.101e-03 s (53.71 %) + memory allocations took 2.861e-06 s (0.04 %) leafs setup took 9.537e-07 s (0.01 %) - halfword conversion took 2.316e-03 s (25.13 %) -Built (100 x 100)[0xaaaac729ee40]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.009s): (100 x 100)[0xaaaac729ee40]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + halfword conversion took 1.927e-03 s (25.24 %) +Built (100 x 100)[0xaaaae44c3e80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.008s): (100 x 100)[0xaaaae44c3e80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -6086,10 +6122,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.00189s; avg 0.00063s ( +/- 1.30/ 0.97 %); best 0.0006218s; worst 0.0006361s; std dev. 6.02e-06 (taking best). -Reference operation time is 0.000621796 s (32.49 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0006218 Mflops: 32.487) -Merge (3 -> 1 leaves) took w.c.t. of 5.198e-05s, ~4.387e-05s of computing time (of which 1.788e-05s sorting, 2.146e-06s analysis) +3 iterations (1 th.) took 0.002509s; avg 0.0008363s ( +/- 0.39/ 0.67 %); best 0.000833s; worst 0.0008419s; std dev. 3.953e-06 (taking best). +Reference operation time is 0.000833035 s (24.25 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.000833 Mflops: 24.249) +Merge (3 -> 1 leaves) took w.c.t. of 5.102e-05s, ~4.292e-05s of computing time (of which 1.717e-05s sorting, 1.907e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6120,8 +6156,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 12.31/ 15.38 %); best 9.06e-06s; worst 1.192e-05s; std dev. 1.189e-06 (taking best). -Reference operation time is 9.05991e-06 s (2230 Mflops) with 1 threads. +3 iterations (1 th.) took 3.004e-05s; avg 1.001e-05s ( +/- 0.00/ 0.00 %); best 1.001e-05s; worst 1.001e-05s; std dev. 0 (taking best). +Reference operation time is 1.00136e-05 s (2017 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6137,16 +6173,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 9.06e-06 s ~Mflops: 2229.604 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 68.632x: 0.0006218s -> 9.06e-06s, so taking this instance. +After merge step 1: tpop: 1.001e-05 s ~Mflops: 2017.260 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 83.190x: 0.000833s -> 1.001e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.008397s (of which 5.412e-05s partitioning, 0.006246s I/O); computing times: 4.387e-05s in par. loops, 1.788e-05s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.008397s, equivalent to 926.8/13.5 new/old ops (0.003599s for 2 clones -- as 397.2/5.8 ops, or 198.6/2.9 ops per clone), SPEEDUP of 68.632x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 68.632x (0.0006218s -> 9.06e-06s), will amortize in 13.7 ops by saving 0.0006127s per op. -In 1 tuning rounds (tot. 0.012s, 0.0036s for constructor, 2 clones) obtained a SPEEDUP of 6763.2% (68.63x) (from 32.49 to 2230 Mflops). Employed 0.008s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00981s (of which 5.293e-05s partitioning, 0.00728s I/O); computing times: 4.292e-05s in par. loops, 1.717e-05s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.00981s, equivalent to 979.7/11.8 new/old ops (0.004831s for 2 clones -- as 482.5/5.8 ops, or 241.2/2.9 ops per clone), SPEEDUP of 83.190x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 83.190x (0.000833s -> 1.001e-05s), will amortize in 11.9 ops by saving 0.000823s per op. +In 1 tuning rounds (tot. 0.015s, 0.0048s for constructor, 2 clones) obtained a SPEEDUP of 8219.0% (83.19x) (from 24.25 to 2017 Mflops). Employed 0.0086s for I/O of matrix plots. #pr: updating sample at index 2 (1^th of 4), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.020225 s (6.218e-04 s -> 9.060e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0234132 s (8.330e-04 s -> 1.001e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6212,20 +6248,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.29e-05s; avg 1.097e-05s ( +/- 19.57/ 36.96 %); best 8.821e-06s; worst 1.502e-05s; std dev. 2.868e-06 (taking best). +3 iterations (1 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 14.62/ 26.92 %); best 8.821e-06s; worst 1.311e-05s; std dev. 1.969e-06 (taking best). Reference operation time is 8.82149e-06 s (2290 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.921e-03 s (100.00 %) - analyzed arrays in 3.600e-04 s (18.74 %) - cleaned-up arrays in 1.407e-05 s (0.73 %) - deduplicated arrays in 1.192e-05 s (0.62 %) + converted COO to RSB in 3.114e-03 s (100.00 %) + analyzed arrays in 1.106e-03 s (35.52 %) + cleaned-up arrays in 1.407e-05 s (0.45 %) + deduplicated arrays in 1.192e-05 s (0.38 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.529e-03 s (79.60 %) - memory allocations took 3.099e-06 s (0.16 %) - leafs setup took 9.537e-07 s (0.05 %) - halfword conversion took 1.907e-06 s (0.10 %) -Built (100 x 100)[0xaaaac729ed20]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 1.973e-03 s (63.36 %) + memory allocations took 5.007e-06 s (0.16 %) + leafs setup took 9.537e-07 s (0.03 %) + halfword conversion took 1.907e-06 s (0.06 %) +Built (100 x 100)[0xaaaae44c3d60]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6259,16 +6295,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.960e-03 s (100.00 %) - analyzed arrays in 1.311e-03 s (66.90 %) - cleaned-up arrays in 1.383e-05 s (0.71 %) - deduplicated arrays in 1.216e-05 s (0.62 %) + converted COO to RSB in 1.733e-03 s (100.00 %) + analyzed arrays in 8.619e-04 s (49.73 %) + cleaned-up arrays in 1.407e-05 s (0.81 %) + deduplicated arrays in 1.216e-05 s (0.70 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 6.180e-04 s (31.53 %) - memory allocations took 9.537e-07 s (0.05 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 2.861e-06 s (0.15 %) -Built (100 x 100)[0xaaaac7295250]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 8.399e-04 s (48.47 %) + memory allocations took 1.907e-06 s (0.11 %) + leafs setup took 1.192e-06 s (0.07 %) + halfword conversion took 1.907e-06 s (0.11 %) +Built (100 x 100)[0xaaaae44ba290]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6314,7 +6350,7 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 2.909e-05s; avg 9.696e-06s ( +/- 18.85/ 25.41 %); best 7.868e-06s; worst 1.216e-05s; std dev. 1.809e-06 (taking best). +3 iterations (1 th.) took 2.789e-05s; avg 9.298e-06s ( +/- 15.38/ 17.95 %); best 7.868e-06s; worst 1.097e-05s; std dev. 1.277e-06 (taking best). Reference operation time is 7.86781e-06 s (2567 Mflops) with 1 threads. Challenging best inner round reference (8.82149e-06 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 7.86781e-06 s/0 threads (speedup 1.12121 x), same?n. # librsb version 1.3.0.2 - 202212201855: Initializing @@ -6349,16 +6385,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.277e-03 s (100.00 %) - analyzed arrays in 1.961e-03 s (45.85 %) - cleaned-up arrays in 1.311e-05 s (0.31 %) - deduplicated arrays in 1.287e-05 s (0.30 %) + converted COO to RSB in 5.407e-03 s (100.00 %) + analyzed arrays in 2.005e-03 s (37.08 %) + cleaned-up arrays in 5.412e-05 s (1.00 %) + deduplicated arrays in 1.407e-05 s (0.26 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.304e-03 s (30.49 %) - memory allocations took 4.053e-06 s (0.09 %) + shuffled partitions in 1.667e-03 s (30.83 %) + memory allocations took 3.099e-06 s (0.06 %) leafs setup took 1.907e-06 s (0.04 %) - halfword conversion took 9.801e-04 s (22.92 %) -Built (100 x 100)[0xaaaac729ee40]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 8, symflags:'LS' + halfword conversion took 1.661e-03 s (30.72 %) +Built (100 x 100)[0xaaaae44c3e80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 8, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6404,9 +6440,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002347s; avg 0.0007823s ( +/- 21.25/ 38.94 %); best 0.0006161s; worst 0.001087s; std dev. 0.0002157 (taking best). -Reference operation time is 0.000616074 s (32.79 Mflops) with 1 threads. -Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 0.5, 8 leaves, 2.185 bytes/nz, 0.000616074 s/0 threads (speedup 0.0127709 x), same?n. +3 iterations (1 th.) took 0.002495s; avg 0.0008317s ( +/- 4.17/ 4.23 %); best 0.000797s; worst 0.0008669s; std dev. 2.852e-05 (taking best). +Reference operation time is 0.000797033 s (25.34 Mflops) with 1 threads. +Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 0.5, 8 leaves, 2.185 bytes/nz, 0.000797033 s/0 threads (speedup 0.00987137 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 11 subms, 8 lsubms, 2.1846 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6440,16 +6476,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.026e-03 s (100.00 %) - analyzed arrays in 1.290e-03 s (32.04 %) - cleaned-up arrays in 1.216e-05 s (0.30 %) - deduplicated arrays in 1.097e-05 s (0.27 %) + converted COO to RSB in 5.251e-03 s (100.00 %) + analyzed arrays in 1.938e-03 s (36.91 %) + cleaned-up arrays in 1.311e-05 s (0.25 %) + deduplicated arrays in 1.097e-05 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.429e-03 s (35.49 %) - memory allocations took 1.907e-06 s (0.05 %) - leafs setup took 1.192e-06 s (0.03 %) - halfword conversion took 1.280e-03 s (31.79 %) -Built (100 x 100)[0xaaaac729ee40]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 19, symflags:'LS' + shuffled partitions in 1.911e-03 s (36.39 %) + memory allocations took 2.861e-06 s (0.05 %) + leafs setup took 1.907e-06 s (0.04 %) + halfword conversion took 1.373e-03 s (26.15 %) +Built (100 x 100)[0xaaaae44c3e80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 19, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6495,9 +6531,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002184s; avg 0.000728s ( +/- 15.37/ 24.59 %); best 0.0006161s; worst 0.0009069s; std dev. 0.0001279 (taking best). -Reference operation time is 0.000616074 s (32.79 Mflops) with 1 threads. -Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 1, 19 leaves, 2.272 bytes/nz, 0.000616074 s/0 threads (speedup 0.0127709 x), same?n. +3 iterations (1 th.) took 0.002506s; avg 0.0008353s ( +/- 14.66/ 26.55 %); best 0.0007129s; worst 0.001057s; std dev. 0.0001571 (taking best). +Reference operation time is 0.000712872 s (28.34 Mflops) with 1 threads. +Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 1, 19 leaves, 2.272 bytes/nz, 0.000712872 s/0 threads (speedup 0.0110368 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 26 subms, 19 lsubms, 2.2725 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6531,16 +6567,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.169e-03 s (100.00 %) - analyzed arrays in 1.278e-03 s (30.65 %) - cleaned-up arrays in 1.192e-05 s (0.29 %) - deduplicated arrays in 1.121e-05 s (0.27 %) + converted COO to RSB in 4.336e-03 s (100.00 %) + analyzed arrays in 1.721e-03 s (39.69 %) + cleaned-up arrays in 1.192e-05 s (0.27 %) + deduplicated arrays in 1.216e-05 s (0.28 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.293e-03 s (31.01 %) + shuffled partitions in 1.418e-03 s (32.71 %) memory allocations took 2.861e-06 s (0.07 %) - leafs setup took 2.146e-06 s (0.05 %) - halfword conversion took 1.570e-03 s (37.66 %) -Built (100 x 100)[0xaaaac729ee40]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + leafs setup took 2.861e-06 s (0.07 %) + halfword conversion took 1.167e-03 s (26.92 %) +Built (100 x 100)[0xaaaae44c3e80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6586,9 +6622,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001787s; avg 0.0005957s ( +/- 11.51/ 6.10 %); best 0.0005271s; worst 0.000632s; std dev. 4.853e-05 (taking best). -Reference operation time is 0.000527143 s (38.32 Mflops) with 1 threads. -Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000527143 s/0 threads (speedup 0.0149254 x), same?n. +3 iterations (1 th.) took 0.001981s; avg 0.0006603s ( +/- 1.87/ 0.99 %); best 0.000648s; worst 0.0006669s; std dev. 8.715e-06 (taking best). +Reference operation time is 0.000648022 s (31.17 Mflops) with 1 threads. +Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000648022 s/0 threads (speedup 0.0121413 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6622,16 +6658,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.781e-03 s (100.00 %) - analyzed arrays in 1.795e-03 s (37.55 %) - cleaned-up arrays in 1.097e-05 s (0.23 %) - deduplicated arrays in 1.001e-05 s (0.21 %) + converted COO to RSB in 4.370e-03 s (100.00 %) + analyzed arrays in 1.672e-03 s (38.26 %) + cleaned-up arrays in 1.216e-05 s (0.28 %) + deduplicated arrays in 1.001e-05 s (0.23 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.642e-03 s (34.34 %) - memory allocations took 2.861e-06 s (0.06 %) - leafs setup took 2.146e-06 s (0.04 %) - halfword conversion took 1.318e-03 s (27.57 %) -Built (100 x 100)[0xaaaac72c0bf0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.394e-03 s (31.90 %) + memory allocations took 1.073e-05 s (0.25 %) + leafs setup took 1.907e-06 s (0.04 %) + halfword conversion took 1.269e-03 s (29.04 %) +Built (100 x 100)[0xaaaae44e5c30]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6677,9 +6713,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001604s; avg 0.0005347s ( +/- 3.86/ 5.50 %); best 0.000514s; worst 0.0005641s; std dev. 2.135e-05 (taking best). -Reference operation time is 0.00051403 s (39.3 Mflops) with 1 threads. -Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.00051403 s/0 threads (speedup 0.0153061 x), same?n. +3 iterations (1 th.) took 0.001977s; avg 0.000659s ( +/- 6.66/ 13.02 %); best 0.0006151s; worst 0.0007448s; std dev. 6.07e-05 (taking best). +Reference operation time is 0.00061512 s (32.84 Mflops) with 1 threads. +Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.00061512 s/0 threads (speedup 0.0127907 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz Best sparse multiply performance with subdivision multiplier of 0.25: 2567.42 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing @@ -6697,9 +6733,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0300021 s (eq. to 3e+03/ 4e+03 old/new op.times), gained local/global speedup 1.12121 x (8.82149e-06 : 7.86781e-06) / 1.12121 x (8.82149e-06 : 7.86781e-06). This is amortizable in 31460 op.times. -In 1 tuning rounds (tot. 0.03s, 0.021s for constructor, 0 clones) obtained a SPEEDUP of 12.1% (1.121x) (from 2290 to 2567 Mflops). -Second run of RSB Autotuner took 0.0300272 s and estimated a speedup of 1.121212 x (8.821e-06 s -> 7.868e-06 s per op) in new matrix (1 -> 1 lsubm) +Last tuner inner round (1 of 1) took 0.0337651 s (eq. to 4e+03/ 4e+03 old/new op.times), gained local/global speedup 1.12121 x (8.82149e-06 : 7.86781e-06) / 1.12121 x (8.82149e-06 : 7.86781e-06). This is amortizable in 35406 op.times. +In 1 tuning rounds (tot. 0.034s, 0.024s for constructor, 0 clones) obtained a SPEEDUP of 12.1% (1.121x) (from 2290 to 2567 Mflops). +Second run of RSB Autotuner took 0.0337889 s and estimated a speedup of 1.121212 x (8.821e-06 s -> 7.868e-06 s per op) in new matrix (1 -> 1 lsubm) RSB Autotuner suggested a new matrix: freeing the old one. #min:1 #max:1 @@ -6707,13 +6743,13 @@ #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001808 0.005058 0.006866 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.006866 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001808 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005058 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001572 0.004101 0.005673 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005673 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001572 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004101 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.006866 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005673 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -6728,34 +6764,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00921488 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00763512 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00180793 0 0.00505805 -# so far, program took 5.457s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.133s/0.000s . +%constructor:lower-100x100-5050nz 0 0.00157189 0 0.00410104 +# so far, program took 5.519s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.151s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.05983s (system CPU time used) -ru_utime : 6.136s (user CPU time used) +ru_stime : 0.04788s (system CPU time used) +ru_utime : 6.465s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.457s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.133s/0.000s . +# so far, program took 5.519s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.151s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.758e-03 s (100.00 %) - analyzed arrays in 2.801e-03 s (41.45 %) - cleaned-up arrays in 1.001e-05 s (0.15 %) - deduplicated arrays in 8.106e-06 s (0.12 %) + converted COO to RSB in 4.352e-03 s (100.00 %) + analyzed arrays in 6.449e-04 s (14.82 %) + cleaned-up arrays in 1.097e-05 s (0.25 %) + deduplicated arrays in 9.060e-06 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.860e-03 s (42.32 %) - memory allocations took 3.099e-06 s (0.05 %) - leafs setup took 1.192e-06 s (0.02 %) - halfword conversion took 1.074e-03 s (15.89 %) -Built (100 x 100)[0xaaaac729ee40]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.007s): (100 x 100)[0xaaaac729ee40]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 2.456e-03 s (56.44 %) + memory allocations took 3.099e-06 s (0.07 %) + leafs setup took 0.000e+00 s (0.00 %) + halfword conversion took 1.226e-03 s (28.17 %) +Built (100 x 100)[0xaaaae44c3e80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.004s): (100 x 100)[0xaaaae44c3e80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -6806,10 +6842,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.004213s; avg 0.001404s ( +/- 61.33/102.52 %); best 0.0005431s; worst 0.002844s; std dev. 0.001025 (taking best). -Reference operation time is 0.000543118 s (148.8 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0005431 Mflops: 148.771) -Merge (3 -> 1 leaves) took w.c.t. of 4.005e-05s, ~3.386e-05s of computing time (of which 1.407e-05s sorting, 9.537e-07s analysis) +3 iterations (1 th.) took 0.001638s; avg 0.000546s ( +/- 2.40/ 1.31 %); best 0.0005329s; worst 0.0005531s; std dev. 9.285e-06 (taking best). +Reference operation time is 0.000532866 s (151.6 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0005329 Mflops: 151.633) +Merge (3 -> 1 leaves) took w.c.t. of 3.695e-05s, ~3.099e-05s of computing time (of which 1.287e-05s sorting, 9.537e-07s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6840,8 +6876,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 6.604e-05s; avg 2.201e-05s ( +/- 4.69/ 9.39 %); best 2.098e-05s; worst 2.408e-05s; std dev. 1.461e-06 (taking best). -Reference operation time is 2.09808e-05 s (3851 Mflops) with 1 threads. +3 iterations (1 th.) took 7.01e-05s; avg 2.337e-05s ( +/- 5.10/ 7.14 %); best 2.217e-05s; worst 2.503e-05s; std dev. 1.216e-06 (taking best). +Reference operation time is 2.21729e-05 s (3644 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6857,16 +6893,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 2.098e-05 s ~Mflops: 3851.134 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 25.886x: 0.0005431s -> 2.098e-05s, so taking this instance. +After merge step 1: tpop: 2.217e-05 s ~Mflops: 3644.083 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 24.032x: 0.0005329s -> 2.217e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01063s (of which 4.196e-05s partitioning, 0.005486s I/O); computing times: 3.386e-05s in par. loops, 1.407e-05s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.01063s, equivalent to 506.6/19.6 new/old ops (0.00617s for 2 clones -- as 294.1/11.4 ops, or 147.0/5.7 ops per clone), SPEEDUP of 25.886x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 25.886x (0.0005431s -> 2.098e-05s), will amortize in 20.4 ops by saving 0.0005221s per op. -In 1 tuning rounds (tot. 0.016s, 0.0062s for constructor, 2 clones) obtained a SPEEDUP of 2488.6% (25.89x) (from 148.8 to 3851 Mflops). Employed 0.0052s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.006856s (of which 4.005e-05s partitioning, 0.005183s I/O); computing times: 3.099e-05s in par. loops, 1.287e-05s sorting, 9.537e-07s analyzing) +Total merge + benchmarking process took 0.006856s, equivalent to 309.2/12.9 new/old ops (0.003009s for 2 clones -- as 135.7/5.6 ops, or 67.9/2.8 ops per clone), SPEEDUP of 24.032x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 24.032x (0.0005329s -> 2.217e-05s), will amortize in 13.4 ops by saving 0.0005107s per op. +In 1 tuning rounds (tot. 0.01s, 0.003s for constructor, 2 clones) obtained a SPEEDUP of 2303.2% (24.03x) (from 151.6 to 3644 Mflops). Employed 0.0055s for I/O of matrix plots. #pr: updating sample at index 3 (2^th of 4), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.021585 s (5.431e-04 s -> 2.098e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0156832 s (5.329e-04 s -> 2.217e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6932,20 +6968,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 6.509e-05s; avg 2.17e-05s ( +/- 13.19/ 25.27 %); best 1.884e-05s; worst 2.718e-05s; std dev. 3.879e-06 (taking best). -Reference operation time is 1.88351e-05 s (4290 Mflops) with 1 threads. +3 iterations (1 th.) took 7.2e-05s; avg 2.4e-05s ( +/- 8.61/ 12.25 %); best 2.193e-05s; worst 2.694e-05s; std dev. 2.135e-06 (taking best). +Reference operation time is 2.19345e-05 s (3684 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.406e-03 s (100.00 %) - analyzed arrays in 6.371e-04 s (18.70 %) - cleaned-up arrays in 9.060e-06 s (0.27 %) - deduplicated arrays in 9.060e-06 s (0.27 %) + converted COO to RSB in 1.679e-03 s (100.00 %) + analyzed arrays in 5.832e-04 s (34.73 %) + cleaned-up arrays in 1.097e-05 s (0.65 %) + deduplicated arrays in 9.060e-06 s (0.54 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.745e-03 s (80.59 %) - memory allocations took 9.537e-07 s (0.03 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 2.146e-06 s (0.06 %) -Built (100 x 100)[0xaaaac729ed20]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 1.073e-03 s (63.89 %) + memory allocations took 9.537e-07 s (0.06 %) + leafs setup took 9.537e-07 s (0.06 %) + halfword conversion took 1.192e-06 s (0.07 %) +Built (100 x 100)[0xaaaae44c3d60]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6979,16 +7015,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.563e-03 s (100.00 %) - analyzed arrays in 6.840e-04 s (26.69 %) - cleaned-up arrays in 1.001e-05 s (0.39 %) - deduplicated arrays in 8.106e-06 s (0.32 %) + converted COO to RSB in 2.913e-03 s (100.00 %) + analyzed arrays in 7.491e-04 s (25.72 %) + cleaned-up arrays in 1.001e-05 s (0.34 %) + deduplicated arrays in 9.060e-06 s (0.31 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.270e-04 s (36.17 %) + shuffled partitions in 1.075e-03 s (36.90 %) memory allocations took 1.907e-06 s (0.07 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 9.310e-04 s (36.33 %) -Built (100 x 100)[0xaaaac729ee40]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + leafs setup took 9.537e-07 s (0.03 %) + halfword conversion took 1.067e-03 s (36.63 %) +Built (100 x 100)[0xaaaae44c3e80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7034,9 +7070,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001422s; avg 0.000474s ( +/- 0.40/ 0.40 %); best 0.0004721s; worst 0.0004759s; std dev. 1.557e-06 (taking best). -Reference operation time is 0.000472069 s (171.2 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000472069 s/0 threads (speedup 0.039899 x), same?n. +3 iterations (1 th.) took 0.001444s; avg 0.0004813s ( +/- 20.24/ 10.12 %); best 0.0003839s; worst 0.00053s; std dev. 6.89e-05 (taking best). +Reference operation time is 0.000383854 s (210.5 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000383854 s/0 threads (speedup 0.0571429 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7070,16 +7106,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.003e-03 s (100.00 %) - analyzed arrays in 1.129e-03 s (37.59 %) - cleaned-up arrays in 9.060e-06 s (0.30 %) - deduplicated arrays in 8.821e-06 s (0.29 %) + converted COO to RSB in 3.438e-03 s (100.00 %) + analyzed arrays in 1.282e-03 s (37.30 %) + cleaned-up arrays in 9.775e-06 s (0.28 %) + deduplicated arrays in 9.060e-06 s (0.26 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.379e-04 s (31.23 %) - memory allocations took 3.338e-06 s (0.11 %) + shuffled partitions in 1.072e-03 s (31.18 %) + memory allocations took 2.146e-06 s (0.06 %) leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 9.141e-04 s (30.44 %) -Built (100 x 100)[0xaaaac729ee40]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + halfword conversion took 1.062e-03 s (30.89 %) +Built (100 x 100)[0xaaaae44c3e80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7125,9 +7161,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002602s; avg 0.0008674s ( +/- 44.89/ 79.96 %); best 0.000478s; worst 0.001561s; std dev. 0.0004917 (taking best). -Reference operation time is 0.000478029 s (169 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000478029 s/0 threads (speedup 0.0394015 x), same?n. +3 iterations (1 th.) took 0.00141s; avg 0.00047s ( +/- 15.74/ 12.77 %); best 0.000396s; worst 0.00053s; std dev. 5.559e-05 (taking best). +Reference operation time is 0.000396013 s (204 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000396013 s/0 threads (speedup 0.0553883 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7161,16 +7197,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.257e-03 s (100.00 %) - analyzed arrays in 1.053e-03 s (32.33 %) - cleaned-up arrays in 8.821e-06 s (0.27 %) - deduplicated arrays in 9.060e-06 s (0.28 %) + converted COO to RSB in 3.369e-03 s (100.00 %) + analyzed arrays in 1.202e-03 s (35.68 %) + cleaned-up arrays in 1.001e-05 s (0.30 %) + deduplicated arrays in 7.868e-06 s (0.23 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.103e-03 s (33.86 %) - memory allocations took 1.192e-06 s (0.04 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 1.080e-03 s (33.16 %) -Built (100 x 100)[0xaaaac729ee40]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' + shuffled partitions in 1.080e-03 s (32.06 %) + memory allocations took 4.053e-06 s (0.12 %) + leafs setup took 1.907e-06 s (0.06 %) + halfword conversion took 1.062e-03 s (31.53 %) +Built (100 x 100)[0xaaaae44c3e80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7216,9 +7252,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001767s; avg 0.000589s ( +/- 16.33/ 26.50 %); best 0.0004928s; worst 0.0007451s; std dev. 0.0001114 (taking best). -Reference operation time is 0.000492811 s (164 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.000492811 s/0 threads (speedup 0.0382196 x), same?n. +3 iterations (1 th.) took 0.001454s; avg 0.0004846s ( +/- 18.48/ 11.43 %); best 0.0003951s; worst 0.00054s; std dev. 6.392e-05 (taking best). +Reference operation time is 0.00039506 s (204.5 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.00039506 s/0 threads (speedup 0.055522 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 34 subms, 25 lsubms, 2.3168 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7252,16 +7288,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.838e-03 s (100.00 %) - analyzed arrays in 1.396e-03 s (36.37 %) - cleaned-up arrays in 8.821e-06 s (0.23 %) - deduplicated arrays in 8.106e-06 s (0.21 %) - sorted arrays in 9.537e-07 s (0.02 %) - shuffled partitions in 1.078e-03 s (28.08 %) - memory allocations took 2.384e-06 s (0.06 %) - leafs setup took 2.146e-06 s (0.06 %) - halfword conversion took 1.341e-03 s (34.94 %) -Built (100 x 100)[0xaaaac72c5ae0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + converted COO to RSB in 3.621e-03 s (100.00 %) + analyzed arrays in 1.303e-03 s (35.98 %) + cleaned-up arrays in 1.001e-05 s (0.28 %) + deduplicated arrays in 7.868e-06 s (0.22 %) + sorted arrays in 0.000e+00 s (0.00 %) + shuffled partitions in 1.090e-03 s (30.10 %) + memory allocations took 2.146e-06 s (0.06 %) + leafs setup took 1.907e-06 s (0.05 %) + halfword conversion took 1.206e-03 s (33.30 %) +Built (100 x 100)[0xaaaae44eab20]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7307,9 +7343,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001534s; avg 0.0005113s ( +/- 8.28/ 5.05 %); best 0.000469s; worst 0.0005372s; std dev. 3.019e-05 (taking best). -Reference operation time is 0.000468969 s (172.3 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000468969 s/0 threads (speedup 0.0401627 x), same?n. +3 iterations (1 th.) took 0.002564s; avg 0.0008547s ( +/- 51.10/ 26.15 %); best 0.0004179s; worst 0.001078s; std dev. 0.0003088 (taking best). +Reference operation time is 0.000417948 s (193.3 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000417948 s/0 threads (speedup 0.0524815 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7343,16 +7379,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.009e-03 s (100.00 %) - analyzed arrays in 2.126e-03 s (35.38 %) - cleaned-up arrays in 9.060e-06 s (0.15 %) - deduplicated arrays in 1.001e-05 s (0.17 %) + converted COO to RSB in 3.861e-03 s (100.00 %) + analyzed arrays in 1.468e-03 s (38.02 %) + cleaned-up arrays in 1.001e-05 s (0.26 %) + deduplicated arrays in 9.060e-06 s (0.23 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.867e-03 s (31.07 %) - memory allocations took 4.053e-06 s (0.07 %) - leafs setup took 2.861e-06 s (0.05 %) - halfword conversion took 1.989e-03 s (33.10 %) -Built (100 x 100)[0xaaaac72c5ae0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.194e-03 s (30.93 %) + memory allocations took 2.861e-06 s (0.07 %) + leafs setup took 1.192e-06 s (0.03 %) + halfword conversion took 1.176e-03 s (30.46 %) +Built (100 x 100)[0xaaaae44eab20]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7398,11 +7434,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002721s; avg 0.0009069s ( +/- 1.31/ 0.76 %); best 0.000895s; worst 0.0009139s; std dev. 8.465e-06 (taking best). -Reference operation time is 0.000895023 s (90.28 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000895023 s/0 threads (speedup 0.0210442 x), same?n. +3 iterations (1 th.) took 0.00163s; avg 0.0005434s ( +/- 13.30/ 9.13 %); best 0.0004711s; worst 0.0005929s; std dev. 5.225e-05 (taking best). +Reference operation time is 0.000471115 s (171.5 Mflops) with 1 threads. +Challenging best inner round reference (2.19345e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000471115 s/0 threads (speedup 0.0465587 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 4289.87 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 3683.69 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7418,23 +7454,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.033011 s (eq. to 2e+03/ 2e+03 old/new op.times), gained local/global speedup 1 x (1.88351e-05 : 1.88351e-05) / 1 x (1.88351e-05 : 1.88351e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.028604 s (eq. to 1e+03/ 1e+03 old/new op.times), gained local/global speedup 1 x (2.19345e-05 : 2.19345e-05) / 1 x (2.19345e-05 : 2.19345e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.033s, 0.023s for constructor, 0 clones) obtained NO speedup (best stays 4290 Mflops). -Second run of RSB Autotuner took 0.0330322 s and estimated a speedup of 1.000000 x (1.884e-05 s -> 1.884e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.029s, 0.02s for constructor, 0 clones) obtained NO speedup (best stays 3684 Mflops). +Second run of RSB Autotuner took 0.0286231 s and estimated a speedup of 1.000000 x (2.193e-05 s -> 2.193e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.002801 0.002860 0.005661 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005661 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002801 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002860 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000645 0.002456 0.003101 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003101 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000645 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002456 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005661 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003101 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -7449,34 +7485,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00675797 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00435209 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00280094 0 0.00285983 -# so far, program took 5.522s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.187s/0.000s . +%constructor:lower-100x100-5050nz 0 0.000644922 0 0.00245619 +# so far, program took 5.571s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.195s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.06359s (system CPU time used) -ru_utime : 6.473s (user CPU time used) +ru_stime : 0.0559s (system CPU time used) +ru_utime : 6.844s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.522s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.187s/0.000s . +# so far, program took 5.571s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.195s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 5.408e-03 s (100.00 %) - analyzed arrays in 1.853e-03 s (34.26 %) - cleaned-up arrays in 8.821e-06 s (0.16 %) - deduplicated arrays in 8.106e-06 s (0.15 %) + converted COO to RSB in 4.511e-03 s (100.00 %) + analyzed arrays in 6.351e-04 s (14.08 %) + cleaned-up arrays in 1.001e-05 s (0.22 %) + deduplicated arrays in 9.060e-06 s (0.20 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.500e-03 s (46.23 %) - memory allocations took 4.053e-06 s (0.07 %) + shuffled partitions in 2.360e-03 s (52.32 %) + memory allocations took 1.907e-06 s (0.04 %) leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 1.034e-03 s (19.12 %) -Built (100 x 100)[0xaaaac729ee40]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.005s): (100 x 100)[0xaaaac729ee40]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + halfword conversion took 1.494e-03 s (33.12 %) +Built (100 x 100)[0xaaaae44c3e80]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.005s): (100 x 100)[0xaaaae44c3e80]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -7527,10 +7563,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001539s; avg 0.000513s ( +/- 37.07/ 39.61 %); best 0.0003228s; worst 0.0007162s; std dev. 0.0001609 (taking best). -Reference operation time is 0.000322819 s (250.3 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0003228 Mflops: 250.295) -Merge (3 -> 1 leaves) took w.c.t. of 3.815e-05s, ~3.29e-05s of computing time (of which 1.502e-05s sorting, 1.192e-06s analysis) +3 iterations (1 th.) took 0.001685s; avg 0.0005616s ( +/- 0.67/ 0.61 %); best 0.0005579s; worst 0.0005651s; std dev. 2.929e-06 (taking best). +Reference operation time is 0.000557899 s (144.8 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0005579 Mflops: 144.829) +Merge (3 -> 1 leaves) took w.c.t. of 3.695e-05s, ~3.314e-05s of computing time (of which 1.597e-05s sorting, 9.537e-07s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7561,7 +7597,7 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 5.889e-05s; avg 1.963e-05s ( +/- 2.83/ 2.02 %); best 1.907e-05s; worst 2.003e-05s; std dev. 4.052e-07 (taking best). +3 iterations (1 th.) took 6.008e-05s; avg 2.003e-05s ( +/- 4.76/ 4.76 %); best 1.907e-05s; worst 2.098e-05s; std dev. 7.787e-07 (taking best). Reference operation time is 1.90735e-05 s (4236 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7579,15 +7615,15 @@ # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success After merge step 1: tpop: 1.907e-05 s ~Mflops: 4236.247 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 16.925x: 0.0003228s -> 1.907e-05s, so taking this instance. +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 29.250x: 0.0005579s -> 1.907e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.006236s (of which 4.101e-05s partitioning, 0.004543s I/O); computing times: 3.29e-05s in par. loops, 1.502e-05s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 0.006236s, equivalent to 326.9/19.3 new/old ops (0.002775s for 2 clones -- as 145.5/8.6 ops, or 72.7/4.3 ops per clone), SPEEDUP of 16.925x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 16.925x (0.0003228s -> 1.907e-05s), will amortize in 20.5 ops by saving 0.0003037s per op. -In 1 tuning rounds (tot. 0.0091s, 0.0028s for constructor, 2 clones) obtained a SPEEDUP of 1592.5% (16.93x) (from 250.3 to 4236 Mflops). Employed 0.0046s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.006837s (of which 3.886e-05s partitioning, 0.005017s I/O); computing times: 3.314e-05s in par. loops, 1.597e-05s sorting, 9.537e-07s analyzing) +Total merge + benchmarking process took 0.006837s, equivalent to 358.4/12.3 new/old ops (0.003117s for 2 clones -- as 163.4/5.6 ops, or 81.7/2.8 ops per clone), SPEEDUP of 29.250x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 29.250x (0.0005579s -> 1.907e-05s), will amortize in 12.7 ops by saving 0.0005388s per op. +In 1 tuning rounds (tot. 0.01s, 0.0031s for constructor, 2 clones) obtained a SPEEDUP of 2825.0% (29.25x) (from 144.8 to 4236 Mflops). Employed 0.005s for I/O of matrix plots. #pr: updating sample at index 4 (3^th of 4), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.0138922 s (3.228e-04 s -> 1.907e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0152571 s (5.579e-04 s -> 1.907e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -7653,20 +7689,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 6.39e-05s; avg 2.13e-05s ( +/- 11.57/ 22.01 %); best 1.884e-05s; worst 2.599e-05s; std dev. 3.317e-06 (taking best). -Reference operation time is 1.88351e-05 s (4290 Mflops) with 1 threads. +3 iterations (1 th.) took 6.294e-05s; avg 2.098e-05s ( +/- 9.09/ 18.18 %); best 1.907e-05s; worst 2.48e-05s; std dev. 2.697e-06 (taking best). +Reference operation time is 1.90735e-05 s (4236 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.449e-03 s (100.00 %) - analyzed arrays in 2.918e-04 s (20.14 %) - cleaned-up arrays in 9.060e-06 s (0.63 %) - deduplicated arrays in 7.868e-06 s (0.54 %) - sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.811e-04 s (67.71 %) - memory allocations took 1.571e-04 s (10.84 %) - leafs setup took 9.537e-07 s (0.07 %) - halfword conversion took 9.537e-07 s (0.07 %) -Built (100 x 100)[0xaaaac729ed20]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + converted COO to RSB in 4.211e-03 s (100.00 %) + analyzed arrays in 1.093e-03 s (25.95 %) + cleaned-up arrays in 9.060e-06 s (0.22 %) + deduplicated arrays in 6.914e-06 s (0.16 %) + sorted arrays in 9.537e-07 s (0.02 %) + shuffled partitions in 3.083e-03 s (73.22 %) + memory allocations took 1.407e-05 s (0.33 %) + leafs setup took 1.907e-06 s (0.05 %) + halfword conversion took 1.907e-06 s (0.05 %) +Built (100 x 100)[0xaaaae44c3d60]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7700,16 +7736,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.218e-03 s (100.00 %) - analyzed arrays in 1.197e-03 s (37.20 %) - cleaned-up arrays in 7.868e-06 s (0.24 %) - deduplicated arrays in 8.106e-06 s (0.25 %) + converted COO to RSB in 6.039e-03 s (100.00 %) + analyzed arrays in 3.427e-03 s (56.75 %) + cleaned-up arrays in 1.097e-05 s (0.18 %) + deduplicated arrays in 1.001e-05 s (0.17 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.009e-03 s (31.35 %) - memory allocations took 4.053e-06 s (0.13 %) - leafs setup took 1.907e-06 s (0.06 %) - halfword conversion took 9.902e-04 s (30.77 %) -Built (100 x 100)[0xaaaac729ee40]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' + shuffled partitions in 1.416e-03 s (23.45 %) + memory allocations took 4.053e-06 s (0.07 %) + leafs setup took 1.907e-06 s (0.03 %) + halfword conversion took 1.169e-03 s (19.36 %) +Built (100 x 100)[0xaaaae44c3e80]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7755,9 +7791,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001344s; avg 0.000448s ( +/- 20.97/ 10.48 %); best 0.0003541s; worst 0.000495s; std dev. 6.642e-05 (taking best). -Reference operation time is 0.000354052 s (228.2 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 0.000354052 s/0 threads (speedup 0.0531987 x), same?n. +3 iterations (1 th.) took 0.001722s; avg 0.000574s ( +/- 19.00/ 29.77 %); best 0.0004649s; worst 0.0007448s; std dev. 0.0001223 (taking best). +Reference operation time is 0.000464916 s (173.8 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 0.000464916 s/0 threads (speedup 0.0410256 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 8 subms, 6 lsubms, 2.1632 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7791,16 +7827,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.894e-03 s (100.00 %) - analyzed arrays in 1.350e-03 s (34.67 %) - cleaned-up arrays in 9.060e-06 s (0.23 %) - deduplicated arrays in 7.868e-06 s (0.20 %) + converted COO to RSB in 3.461e-03 s (100.00 %) + analyzed arrays in 1.002e-03 s (28.95 %) + cleaned-up arrays in 1.001e-05 s (0.29 %) + deduplicated arrays in 7.153e-06 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.563e-03 s (40.14 %) - memory allocations took 2.861e-06 s (0.07 %) - leafs setup took 1.907e-06 s (0.05 %) - halfword conversion took 9.580e-04 s (24.60 %) -Built (100 x 100)[0xaaaac729ee40]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' + shuffled partitions in 1.204e-03 s (34.78 %) + memory allocations took 1.907e-06 s (0.06 %) + leafs setup took 2.146e-06 s (0.06 %) + halfword conversion took 1.233e-03 s (35.62 %) +Built (100 x 100)[0xaaaae44c3e80]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7846,9 +7882,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001428s; avg 0.000476s ( +/- 6.73/ 12.81 %); best 0.0004439s; worst 0.0005369s; std dev. 4.312e-05 (taking best). -Reference operation time is 0.000443935 s (182 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 0.5, 16 leaves, 2.25 bytes/nz, 0.000443935 s/0 threads (speedup 0.0424275 x), same?n. +3 iterations (1 th.) took 0.001446s; avg 0.000482s ( +/- 3.10/ 2.04 %); best 0.0004671s; worst 0.0004919s; std dev. 1.074e-05 (taking best). +Reference operation time is 0.000467062 s (173 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 0.5, 16 leaves, 2.25 bytes/nz, 0.000467062 s/0 threads (speedup 0.0408372 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 22 subms, 16 lsubms, 2.2503 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7882,16 +7918,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 5.213e-03 s (100.00 %) - analyzed arrays in 1.048e-03 s (20.10 %) - cleaned-up arrays in 9.060e-06 s (0.17 %) - deduplicated arrays in 8.106e-06 s (0.16 %) + converted COO to RSB in 3.358e-03 s (100.00 %) + analyzed arrays in 1.211e-03 s (36.07 %) + cleaned-up arrays in 9.060e-06 s (0.27 %) + deduplicated arrays in 8.821e-06 s (0.26 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.327e-03 s (44.64 %) - memory allocations took 1.907e-06 s (0.04 %) - leafs setup took 3.815e-06 s (0.07 %) - halfword conversion took 1.814e-03 s (34.80 %) -Built (100 x 100)[0xaaaac72ed230]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.138e-03 s (33.89 %) + memory allocations took 2.861e-06 s (0.09 %) + leafs setup took 1.907e-06 s (0.06 %) + halfword conversion took 9.861e-04 s (29.37 %) +Built (100 x 100)[0xaaaae4512270]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7937,9 +7973,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003057s; avg 0.001019s ( +/- 24.64/ 22.48 %); best 0.0007679s; worst 0.001248s; std dev. 0.0001966 (taking best). -Reference operation time is 0.000767946 s (105.2 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 1, 36 leaves, 2.383 bytes/nz, 0.000767946 s/0 threads (speedup 0.0245265 x), same?n. +3 iterations (1 th.) took 0.001249s; avg 0.0004164s ( +/- 26.70/ 14.07 %); best 0.0003052s; worst 0.0004749s; std dev. 7.866e-05 (taking best). +Reference operation time is 0.000305176 s (264.8 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 1, 36 leaves, 2.383 bytes/nz, 0.000305176 s/0 threads (speedup 0.0625 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7973,16 +8009,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.897e-03 s (100.00 %) - analyzed arrays in 1.657e-03 s (42.52 %) - cleaned-up arrays in 1.121e-05 s (0.29 %) - deduplicated arrays in 1.097e-05 s (0.28 %) + converted COO to RSB in 3.311e-03 s (100.00 %) + analyzed arrays in 1.369e-03 s (41.35 %) + cleaned-up arrays in 9.060e-06 s (0.27 %) + deduplicated arrays in 7.868e-06 s (0.24 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 8.450e-04 s (21.68 %) - memory allocations took 3.815e-06 s (0.10 %) - leafs setup took 2.146e-06 s (0.06 %) - halfword conversion took 1.366e-03 s (35.05 %) -Built (100 x 100)[0xaaaac72ed230]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 9.739e-04 s (29.42 %) + memory allocations took 3.099e-06 s (0.09 %) + leafs setup took 1.907e-06 s (0.06 %) + halfword conversion took 9.460e-04 s (28.57 %) +Built (100 x 100)[0xaaaae4512270]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8028,9 +8064,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002075s; avg 0.0006917s ( +/- 49.84/ 50.53 %); best 0.0003469s; worst 0.001041s; std dev. 0.0002835 (taking best). -Reference operation time is 0.000346899 s (232.9 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000346899 s/0 threads (speedup 0.0542955 x), same?n. +3 iterations (1 th.) took 0.001622s; avg 0.0005407s ( +/- 14.58/ 23.74 %); best 0.0004618s; worst 0.000669s; std dev. 9.154e-05 (taking best). +Reference operation time is 0.000461817 s (175 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000461817 s/0 threads (speedup 0.041301 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -8064,16 +8100,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.126e-03 s (100.00 %) - analyzed arrays in 1.367e-03 s (43.73 %) - cleaned-up arrays in 9.060e-06 s (0.29 %) - deduplicated arrays in 7.868e-06 s (0.25 %) + converted COO to RSB in 3.516e-03 s (100.00 %) + analyzed arrays in 1.439e-03 s (40.93 %) + cleaned-up arrays in 9.060e-06 s (0.26 %) + deduplicated arrays in 6.914e-06 s (0.20 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 7.811e-04 s (24.98 %) - memory allocations took 4.053e-06 s (0.13 %) - leafs setup took 1.907e-06 s (0.06 %) - halfword conversion took 9.551e-04 s (30.55 %) -Built (100 x 100)[0xaaaac72ed230]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.142e-03 s (32.48 %) + memory allocations took 2.861e-06 s (0.08 %) + leafs setup took 1.907e-06 s (0.05 %) + halfword conversion took 9.141e-04 s (26.00 %) +Built (100 x 100)[0xaaaae4512270]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8119,11 +8155,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001433s; avg 0.0004776s ( +/- 3.06/ 2.13 %); best 0.000463s; worst 0.0004878s; std dev. 1.06e-05 (taking best). -Reference operation time is 0.000463009 s (174.5 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000463009 s/0 threads (speedup 0.0406797 x), same?n. +3 iterations (1 th.) took 0.001451s; avg 0.0004837s ( +/- 7.38/ 10.81 %); best 0.000448s; worst 0.000536s; std dev. 3.779e-05 (taking best). +Reference operation time is 0.000447989 s (180.4 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000447989 s/0 threads (speedup 0.0425758 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 4289.87 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 4236.25 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8139,23 +8175,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.031405 s (eq. to 2e+03/ 2e+03 old/new op.times), gained local/global speedup 1 x (1.88351e-05 : 1.88351e-05) / 1 x (1.88351e-05 : 1.88351e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.0325689 s (eq. to 2e+03/ 2e+03 old/new op.times), gained local/global speedup 1 x (1.90735e-05 : 1.90735e-05) / 1 x (1.90735e-05 : 1.90735e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.031s, 0.021s for constructor, 0 clones) obtained NO speedup (best stays 4290 Mflops). -Second run of RSB Autotuner took 0.031435 s and estimated a speedup of 1.000000 x (1.884e-05 s -> 1.884e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.033s, 0.024s for constructor, 0 clones) obtained NO speedup (best stays 4236 Mflops). +Second run of RSB Autotuner took 0.032619 s and estimated a speedup of 1.000000 x (1.907e-05 s -> 1.907e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001853 0.002500 0.004353 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004353 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001853 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002500 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000635 0.002360 0.002995 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002995 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000635 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002360 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004353 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002995 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -8170,68 +8206,68 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00540805 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00451088 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00185299 0 0.00250006 -# so far, program took 5.575s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.233s/0.000s . +%constructor:lower-100x100-5050nz 0 0.000635147 0 0.00235987 +# so far, program took 5.627s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.243s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.06371s (system CPU time used) -ru_utime : 6.81s (user CPU time used) +ru_stime : 0.06421s (system CPU time used) +ru_utime : 7.202s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 4) ordered by (1,1,1,1,1,4,1) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 4034.52 1.219e-03 0.000e+00 5.007e-06 0.000e+00 2.847e-02 1.06e+01 2.60e+00 1 2.02e-02 -pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 2229.60 6.218e-04 0.000e+00 9.060e-06 0.000e+00 2.023e-02 3.52e+00 1.56e+00 1 2.02e-02 -pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 3851.13 5.431e-04 0.000e+00 2.098e-05 0.000e+00 2.158e-02 2.54e+00 6.50e-01 1 8.08e-02 -pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 4236.25 3.228e-04 0.000e+00 1.907e-05 0.000e+00 1.389e-02 5.04e+00 1.17e+00 1 8.08e-02 +pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 1193.31 1.185e-03 0.000e+00 1.693e-05 0.000e+00 3.111e-02 3.15e+00 2.60e+00 1 2.02e-02 +pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 2017.26 8.330e-04 0.000e+00 1.001e-05 0.000e+00 2.341e-02 3.19e+00 1.56e+00 1 2.02e-02 +pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 3644.08 5.329e-04 0.000e+00 2.217e-05 0.000e+00 1.568e-02 2.40e+00 6.50e-01 1 8.08e-02 +pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 4236.25 5.579e-04 0.000e+00 1.907e-05 0.000e+00 1.526e-02 5.04e+00 1.17e+00 1 8.08e-02 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 8773.0 % faster, avg. sp. ratio 88.730x, max sp. ratio 243.476x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2418.9/728.4/5685.9/9675.4 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 34.7/ 23.4/ 43.0/138.7 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 35.9, min. 23.4, max. 45.7 ops) +#pr: (in succ. cases rsb autotuning gave avg. 5062.2 % faster, avg. sp. ratio 51.622x, max sp. ratio 83.190x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 1420.8/707.3/2338.1/5683.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 27.8/ 26.3/ 29.4/111.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 28.5, min. 26.6, max. 30.7 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 1683/ 1683/ 1683) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 5050/ 5050/ 5050) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 15150/ 6733/ 26933) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 45450/ 20200/ 80800) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 2.121/ 2.121/ 2.121) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.355/ 2.502/ 10.487,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 21.747/ 2.541/ 10.646,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.393/ 2.368/ 4.955,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 13.778/ 2.404/ 5.039,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.495/ 0.650/ 2.599) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 2.080/ 2.080/ 2.080) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.03 s, tot 0.08 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.03 s, tot 0.08 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.588e+03, min 2.230e+03, max 4.236e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.120e+02, min 1.657e+01, max 2.503e+02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 1.353e-05s, min 5.007e-06s, max 2.098e-05s, tot 5.412e-05s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.767e-04s, min 3.228e-04s, max 1.219e-03s, tot 2.707e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.541e+00 1.903e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.001e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.02 s, max 0.03 s, tot 0.09 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.02 s, max 0.03 s, tot 0.09 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.773e+03, min 1.193e+03, max 4.236e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.444e+01, min 1.704e+01, max 1.516e+02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 1.705e-05s, min 1.001e-05s, max 2.217e-05s, tot 6.819e-05s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 7.772e-04s, min 5.329e-04s, max 1.185e-03s, tot 3.109e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.627e+00 2.014e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 9.986e-01 #pr: Record collection took 0.25 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 104 environment variables in 5819 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 104 environment variables in 5873 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. #pr: ======== Saved a performance record of 4 samples to test.rpr # Removing the temporary record file test.rpr.tmp. -# terminating run at 1796064037 (after 5.6s of w.c.t.) +# terminating run at 1761654553 (after 5.6s of w.c.t.) + ls -ltr test-tuning-lower-100x100-5050nz--C-N-1--base.eps test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--D-N-1--base.eps test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--S-N-1--base.eps test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--Z-N-1--base.eps test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85637 Nov 30 06:40 test-tuning-lower-100x100-5050nz--D-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84561 Nov 30 06:40 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85639 Nov 30 06:40 test-tuning-lower-100x100-5050nz--S-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84561 Nov 30 06:40 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85639 Nov 30 06:40 test-tuning-lower-100x100-5050nz--C-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84561 Nov 30 06:40 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85639 Nov 30 06:40 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84561 Nov 30 06:40 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85640 Oct 29 02:29 test-tuning-lower-100x100-5050nz--D-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84564 Oct 29 02:29 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85644 Oct 29 02:29 test-tuning-lower-100x100-5050nz--S-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84566 Oct 29 02:29 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85644 Oct 29 02:29 test-tuning-lower-100x100-5050nz--C-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84566 Oct 29 02:29 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85644 Oct 29 02:29 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84566 Oct 29 02:29 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps + rsbench --read-performance-record test.rpr + ls -ltr test.txt --rw-r--r-- 1 pbuilder1 pbuilder1 4093 Nov 30 06:40 test.txt +-rw-r--r-- 1 pbuilder2 pbuilder2 4092 Oct 29 02:29 test.txt + RSB_PR_WLTC=2 + RSB_PR_SR=0 + rsbench --read-performance-record test.rpr @@ -8241,29 +8277,29 @@ /usr/bin/kpsepath ++ kpsepath tex ++ sed 's/!!//g;s/:/\n/g;' -+ find . /nonexistent/first-build/.texlive2025/texmf-config/tex/kpsewhich// /nonexistent/first-build/.texlive2025/texmf-var/tex/kpsewhich// /nonexistent/first-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/first-build/.texlive2025/texmf-config/tex/generic// /nonexistent/first-build/.texlive2025/texmf-var/tex/generic// /nonexistent/first-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/first-build/.texlive2025/texmf-config/tex/latex// /nonexistent/first-build/.texlive2025/texmf-var/tex/latex// /nonexistent/first-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/first-build/.texlive2025/texmf-config/tex/// /nonexistent/first-build/.texlive2025/texmf-var/tex/// /nonexistent/first-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls -find: '/nonexistent/first-build/.texlive2025/texmf-config/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-var/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/kpsewhich//': No such file or directory ++ find . /nonexistent/second-build/.texlive2025/texmf-config/tex/kpsewhich// /nonexistent/second-build/.texlive2025/texmf-var/tex/kpsewhich// /nonexistent/second-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/second-build/.texlive2025/texmf-config/tex/generic// /nonexistent/second-build/.texlive2025/texmf-var/tex/generic// /nonexistent/second-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/second-build/.texlive2025/texmf-config/tex/latex// /nonexistent/second-build/.texlive2025/texmf-var/tex/latex// /nonexistent/second-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/second-build/.texlive2025/texmf-config/tex/// /nonexistent/second-build/.texlive2025/texmf-var/tex/// /nonexistent/second-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls +find: '/nonexistent/second-build/.texlive2025/texmf-config/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-var/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/kpsewhich//': No such file or directory find: '/usr/local/share/texmf/tex/kpsewhich//': No such file or directory find: '/etc/texmf/tex/kpsewhich//': No such file or directory find: '/var/lib/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texlive/texmf-dist/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-config/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-var/tex/generic//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-config/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-var/tex/generic//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/generic//': No such file or directory find: '/usr/local/share/texmf/tex/generic//': No such file or directory find: '/usr/share/texmf/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-config/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-var/tex/latex//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-config/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-var/tex/latex//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/latex//': No such file or directory find: '/usr/local/share/texmf/tex/latex//': No such file or directory find: '/etc/texmf/tex/latex//': No such file or directory find: '/var/lib/texmf/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-config/tex///': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-var/tex///': No such file or directory -find: '/nonexistent/first-build/texmf/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-config/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-var/tex///': No such file or directory +find: '/nonexistent/second-build/texmf/tex///': No such file or directory find: '/usr/local/share/texmf/tex///': No such file or directory + exit 0 for mf in pd.mtx vf.mtx ; do if test -f /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; then true; else cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/$mf /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; fi; done @@ -8278,7 +8314,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0xaaab0fbf74a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0xaaab1b3c74a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -8293,7 +8329,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0xaaaae88844a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0xaaaae043e4a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -8357,51 +8393,51 @@ Done. Building a matrix with 5 nnz, 5 x 5 Duplicates check: 5 - 0 = 5 - converted COO to RSB in 3.684e-03 s (100.00 %) - analyzed arrays in 1.450e-03 s (39.36 %) + converted COO to RSB in 9.496e-03 s (100.00 %) + analyzed arrays in 3.114e-03 s (32.79 %) cleaned-up arrays in 0.000e+00 s (0.00 %) - deduplicated arrays in 0.000e+00 s (0.00 %) - sorted arrays in 2.470e-04 s (6.71 %) - shuffled partitions in 9.890e-04 s (26.85 %) - memory allocations took 2.861e-06 s (0.08 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 9.940e-04 s (26.98 %) -Built (5 x 5)[0xaaaae8886820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' + deduplicated arrays in 9.537e-07 s (0.01 %) + sorted arrays in 1.957e-03 s (20.61 %) + shuffled partitions in 1.996e-03 s (21.02 %) + memory allocations took 5.245e-06 s (0.06 %) + leafs setup took 1.907e-06 s (0.02 %) + halfword conversion took 2.420e-03 s (25.48 %) +Built (5 x 5)[0xaaaae0440820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' Allocated matrix of 5 nonzeroes: -(5 x 5)[0xaaaae8886820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(5 x 5)[0xaaaae0440820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -Before auto-tuning, 100 multiplications took 0.051023s. +Before auto-tuning, 100 multiplications took 0.082394s. Threads autotuning (may take more than 1.500000s)... Will use autotuning routine to sample matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=2.93016e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.001563s; avg 0.000521s ( +/- 23.81/ 31.88 %); best 0.000397s; worst 0.0006871s; std dev. 0.0001221 (taking best). -Reference operation time is 0.000396967 s (0.05038 Mflops) with 12 threads. -3 iterations (12 th.) took 0.001431s; avg 0.000477s ( +/- 0.43/ 0.42 %); best 0.0004749s; worst 0.000479s; std dev. 1.656e-06 (taking best). -Reference operation time is 0.00047493 s (0.04211 Mflops) with 12 threads. -After 0.003033s, autotuning routine did not find a better threads count configuration. -(5 x 5)[0xaaaae8886820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -After threads auto-tuning, 100 multiplications took 0.046746s -- effective speedup of 1.09149 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=7.59959e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.002273s; avg 0.0007577s ( +/- 4.56/ 5.32 %); best 0.0007231s; worst 0.000798s; std dev. 3.083e-05 (taking best). +Reference operation time is 0.000723124 s (0.02766 Mflops) with 12 threads. +3 iterations (12 th.) took 0.002133s; avg 0.000711s ( +/- 0.68/ 1.26 %); best 0.0007062s; worst 0.00072s; std dev. 6.357e-06 (taking best). +Reference operation time is 0.000706196 s (0.02832 Mflops) with 12 threads. +After 0.004449s, autotuning routine did not find a better threads count configuration. +(5 x 5)[0xaaaae0440820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +After threads auto-tuning, 100 multiplications took 0.077650s -- effective speedup of 1.06109 x Matrix autotuning (may take more than 1.500000s; using 12 threads )... Will autotune matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=2.93016e-08), 12 suggested as starting thread count. -3 iterations (12 th.) took 0.001202s; avg 0.0004007s ( +/- 13.43/ 6.86 %); best 0.0003469s; worst 0.0004282s; std dev. 3.805e-05 (taking best). -Reference operation time is 0.000346899 s (0.05765 Mflops) with 12 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.0003469 Mflops: 0.058) -Merge (2 -> 1 leaves) took w.c.t. of 1.001e-05s, ~3.099e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 95.90/200.00 %); best 2.93e-08s; worst 2.146e-06s; std dev. 1.012e-06 (taking best). -Reference operation time is 2.93016e-08 s (682.6 Mflops) with 12 threads. -After merge step 1: tpop: 2.93e-08 s ~Mflops: 682.556 nsubm:1 otn:12 -Applying merge (2 -> 1 leaves, 12 th.) yielded SPEEDUP of 11838.893x: 0.0003469s -> 2.93e-08s, so taking this instance. +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=7.59959e-08), 12 suggested as starting thread count. +3 iterations (12 th.) took 0.001595s; avg 0.0005317s ( +/- 0.67/ 0.63 %); best 0.0005281s; worst 0.000535s; std dev. 2.828e-06 (taking best). +Reference operation time is 0.000528097 s (0.03787 Mflops) with 12 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.0005281 Mflops: 0.038) +Merge (2 -> 1 leaves) took w.c.t. of 1.097e-05s, ~3.099e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 76.09/200.00 %); best 7.6e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 7.59959e-08 s (263.2 Mflops) with 12 threads. +After merge step 1: tpop: 7.6e-08 s ~Mflops: 263.172 nsubm:1 otn:12 +Applying merge (2 -> 1 leaves, 12 th.) yielded SPEEDUP of 6949.020x: 0.0005281s -> 7.6e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.001505s (of which 0.000169s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001505s, equivalent to 51367.0/4.3 new/old ops (0.002595s for 2 clones -- as 88559.8/7.5 ops, or 44279.9/3.7 ops per clone), SPEEDUP of 11838.893x -Applying multi-merge (2 -> 1 leaves, 1 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 11838.893x (0.0003469s -> 2.93e-08s), will amortize in 4.3 ops by saving 0.0003469s per op. -In 1 tuning rounds (tot. 0.004s, 0.0026s for constructor, 2 clones) obtained a SPEEDUP of 1183789.3% (1.184e+04x) (from 0.05765 to 682.6 Mflops). -After 0.004007s, autotuning routine declared speedup of 11838.9 x, when using threads count of 12. -(5 x 5)[0xaaaae8889d70]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' -After threads auto-tuning, 100 multiplications took 0.000010s -- further speedup of 4668.26 x +A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.001872s (of which 2.789e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 9.537e-07s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.001872s, equivalent to 24630.6/3.5 new/old ops (0.003193s for 2 clones -- as 42017.3/6.0 ops, or 21008.6/3.0 ops per clone), SPEEDUP of 6949.020x +Applying multi-merge (2 -> 1 leaves, 1 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 6949.020x (0.0005281s -> 7.6e-08s), will amortize in 3.5 ops by saving 0.000528s per op. +In 1 tuning rounds (tot. 0.0048s, 0.0032s for constructor, 2 clones) obtained a SPEEDUP of 694802.0% (6949x) (from 0.03787 to 263.2 Mflops). +After 0.004852s, autotuning routine declared speedup of 6949.02 x, when using threads count of 12. +(5 x 5)[0xaaaae0443d70]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +After threads auto-tuning, 100 multiplications took 0.000010s -- further speedup of 7754.48 x 0/2 0 0 -> 0 1/2 1 0 -> 5 0/2 0 3 -> 0 @@ -8412,7 +8448,7 @@ Correctly initialized the library. Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0xaaaae8886820]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0xaaaae0440820]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -8563,61 +8599,61 @@ Creating 500 x 500 matrix with 62500 nonzeroes. Building a matrix with 62500 nnz, 500 x 500 Duplicates check: 62500 - 0 = 62500 - converted COO to RSB in 8.653e-03 s (100.00 %) - analyzed arrays in 1.032e-03 s (11.93 %) - cleaned-up arrays in 1.059e-04 s (1.22 %) - deduplicated arrays in 9.084e-05 s (1.05 %) - sorted arrays in 3.794e-03 s (43.85 %) - shuffled partitions in 2.060e-03 s (23.81 %) - memory allocations took 2.003e-05 s (0.23 %) + converted COO to RSB in 7.900e-03 s (100.00 %) + analyzed arrays in 9.270e-04 s (11.73 %) + cleaned-up arrays in 1.049e-04 s (1.33 %) + deduplicated arrays in 1.051e-04 s (1.33 %) + sorted arrays in 3.455e-03 s (43.73 %) + shuffled partitions in 2.188e-03 s (27.70 %) + memory allocations took 2.217e-05 s (0.28 %) leafs setup took 5.007e-06 s (0.06 %) - halfword conversion took 1.542e-03 s (17.82 %) -Built (500 x 500)[0xaaaac7ed62d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' + halfword conversion took 1.090e-03 s (13.80 %) +Built (500 x 500)[0xaaaacc7d62d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' Allocated matrix of 62500 nonzeroes: -(500 x 500)[0xaaaac7ed62d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' +(500 x 500)[0xaaaacc7d62d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' -Before auto-tuning, 100 multiplications took 0.132993s. +Before auto-tuning, 100 multiplications took 0.119712s. Threads autotuning (may take more than 1.500000s)... -Will use autotuning routine to sample matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1195 bpnz. +Will use autotuning routine to sample matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=3.07083e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.003485s; avg 0.001162s ( +/- 11.24/ 7.52 %); best 0.001031s; worst 0.001249s; std dev. 9.407e-05 (taking best). -Reference operation time is 0.00103116 s (242.4 Mflops) with 12 threads. -3 iterations (12 th.) took 0.003376s; avg 0.001125s ( +/- 14.96/ 17.90 %); best 0.000957s; worst 0.001327s; std dev. 0.0001528 (taking best). -Reference operation time is 0.000957012 s (261.2 Mflops) with 12 threads. -After 0.006929s, autotuning routine did not find a better threads count configuration. -(500 x 500)[0xaaaac7ed62d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' -After threads auto-tuning, 100 multiplications took 0.140922s -- effective speedup of 0.943734 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=2.93612e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.002907s; avg 0.000969s ( +/- 40.36/ 50.06 %); best 0.0005779s; worst 0.001454s; std dev. 0.0003638 (taking best). +Reference operation time is 0.000577927 s (432.6 Mflops) with 12 threads. +3 iterations (12 th.) took 0.002383s; avg 0.0007943s ( +/- 30.52/ 23.99 %); best 0.0005519s; worst 0.0009849s; std dev. 0.0001805 (taking best). +Reference operation time is 0.000551939 s (452.9 Mflops) with 12 threads. +After 0.005340s, autotuning routine did not find a better threads count configuration. +(500 x 500)[0xaaaacc7d62d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' +After threads auto-tuning, 100 multiplications took 0.124010s -- effective speedup of 0.96534 x Matrix autotuning (may take more than 1.500000s; using 12 threads )... -Will autotune matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1195 bpnz. +Will autotune matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=3.07083e-08), 12 suggested as starting thread count. -3 iterations (12 th.) took 0.00273s; avg 0.00091s ( +/- 13.09/ 9.23 %); best 0.0007908s; worst 0.000994s; std dev. 8.657e-05 (taking best). -Reference operation time is 0.000790834 s (316.1 Mflops) with 12 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1195 bpnz (tpop: 0.0007908 Mflops: 316.122) -Merge (55 -> 37 leaves) took w.c.t. of 0.0003181s, ~0.001277s of computing time (of which 0.0001249s sorting, 8.821e-06s analysis) -3 iterations (12 th.) took 0.003005s; avg 0.001002s ( +/- 42.30/ 62.73 %); best 0.0005779s; worst 0.00163s; std dev. 0.0004533 (taking best). -Reference operation time is 0.000577927 s (432.6 Mflops) with 12 threads. -After merge step 1: tpop: 0.0005779 s ~Mflops: 432.581 nsubm:37 otn:12 -Applying merge (55 -> 37 leaves, 12 th.) yielded SPEEDUP of 1.368x: 0.0007908s -> 0.0005779s, so taking this instance. -Merge (37 -> 28 leaves) took w.c.t. of 9.108e-05s, ~0.000114s of computing time (of which 5.364e-05s sorting, 6.199e-06s analysis) -3 iterations (12 th.) took 0.002076s; avg 0.000692s ( +/- 9.39/ 8.07 %); best 0.000627s; worst 0.0007479s; std dev. 4.977e-05 (taking best). -Reference operation time is 0.000627041 s (398.7 Mflops) with 12 threads. -After merge step 2: tpop: 0.000627 s ~Mflops: 398.698 nsubm:28 otn:12 -Applying merge (37 -> 28 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.085x: 0.0005779s -> 0.000627s. -Merge (28 -> 22 leaves) took w.c.t. of 0.0007141s, ~6.771e-05s of computing time (of which 3.314e-05s sorting, 4.053e-06s analysis) -3 iterations (12 th.) took 0.005087s; avg 0.001696s ( +/- 46.99/ 61.94 %); best 0.0008988s; worst 0.002746s; std dev. 0.0007752 (taking best). -Reference operation time is 0.000898838 s (278.1 Mflops) with 12 threads. -After merge step 3: tpop: 0.0008988 s ~Mflops: 278.137 nsubm:22 otn:12 -Applying merge (28 -> 22 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.555x: 0.0005779s -> 0.0008988s. -Skipping further merge based tests after 2 definite performance degradations in a row (and last exceeding limit). -A total of 3 merge steps (of max 6) (55 -> 22 subms) took 0.01392s (of which 0.001146s partitioning, 0s I/O); computing times: 0.001459s in par. loops, 0.0002117s sorting, 1.907e-05s analyzing) -Total merge + benchmarking process took 0.01392s, equivalent to 24.1/17.6 new/old ops (0.008278s for 2 clones -- as 14.3/10.5 ops, or 7.2/5.2 ops per clone), SPEEDUP of 1.368x -Applying multi-merge (55 -> 37 leaves, 1 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 1.368x (0.0007908s -> 0.0005779s), will amortize in 65.4 ops by saving 0.0002129s per op. -In 1 tuning rounds (tot. 0.023s, 0.0083s for constructor, 2 clones) obtained a SPEEDUP of 36.8% (1.368x) (from 316.1 to 432.6 Mflops). -After 0.022683s, autotuning routine declared speedup of 1.3684 x, when using threads count of 12. -(500 x 500)[0xaaaac7ede9f0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 37, symflags:'' -After threads auto-tuning, 100 multiplications took 0.134161s -- further speedup of 1.0504 x +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=2.93612e-08), 12 suggested as starting thread count. +3 iterations (12 th.) took 0.003383s; avg 0.001128s ( +/- 18.68/ 28.40 %); best 0.000917s; worst 0.001448s; std dev. 0.0002302 (taking best). +Reference operation time is 0.000916958 s (272.6 Mflops) with 12 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz (tpop: 0.000917 Mflops: 272.641) +Merge (55 -> 37 leaves) took w.c.t. of 0.000504s, ~0.001041s of computing time (of which 0.0001175s sorting, 1.001e-05s analysis) +3 iterations (12 th.) took 0.003372s; avg 0.001124s ( +/- 13.24/ 6.67 %); best 0.0009751s; worst 0.001199s; std dev. 0.0001053 (taking best). +Reference operation time is 0.000975132 s (256.4 Mflops) with 12 threads. +After merge step 1: tpop: 0.0009751 s ~Mflops: 256.376 nsubm:37 otn:12 +Applying merge (55 -> 37 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.063x: 0.000917s -> 0.0009751s. +Merge (37 -> 28 leaves) took w.c.t. of 0.0004661s, ~0.0001171s of computing time (of which 4.697e-05s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 0.002201s; avg 0.0007337s ( +/- 25.29/ 30.28 %); best 0.0005481s; worst 0.0009558s; std dev. 0.0001684 (taking best). +Reference operation time is 0.000548124 s (456.1 Mflops) with 12 threads. +After merge step 2: tpop: 0.0005481 s ~Mflops: 456.101 nsubm:28 otn:12 +Applying merge (37 -> 28 leaves, 12 th.) yielded SPEEDUP of 1.673x: 0.000917s -> 0.0005481s, so taking this instance. +Merge (28 -> 22 leaves) took w.c.t. of 0.000457s, ~8.702e-05s of computing time (of which 3.29e-05s sorting, 2.861e-06s analysis) +3 iterations (12 th.) took 0.006251s; avg 0.002084s ( +/- 63.48/ 83.86 %); best 0.000761s; worst 0.003831s; std dev. 0.001289 (taking best). +Reference operation time is 0.000761032 s (328.5 Mflops) with 12 threads. +After merge step 3: tpop: 0.000761 s ~Mflops: 328.501 nsubm:22 otn:12 +Applying merge (28 -> 22 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.388x: 0.0005481s -> 0.000761s. +Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 3 merge steps (of max 6) (55 -> 22 subms) took 0.01472s (of which 0.001454s partitioning, 0s I/O); computing times: 0.001245s in par. loops, 0.0001974s sorting, 1.693e-05s analyzing) +Total merge + benchmarking process took 0.01472s, equivalent to 26.9/16.1 new/old ops (0.00278s for 2 clones -- as 5.1/3.0 ops, or 2.5/1.5 ops per clone), SPEEDUP of 1.673x +Applying multi-merge (55 -> 28 leaves, 2 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 1.673x (0.000917s -> 0.0005481s), will amortize in 39.9 ops by saving 0.0003688s per op. +In 1 tuning rounds (tot. 0.02s, 0.0028s for constructor, 2 clones) obtained a SPEEDUP of 67.3% (1.673x) (from 272.6 to 456.1 Mflops). +After 0.019765s, autotuning routine declared speedup of 1.6729 x, when using threads count of 12. +(500 x 500)[0xaaaacc7de9f0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' +After threads auto-tuning, 100 multiplications took 0.072883s -- further speedup of 1.7015 x librsb timer-based profiling is not supported in this build. If you wish to have it, re-configure librsb with its support. So you can safely ignore the error you might just have seen printed out on screen. /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve Hello, RSB! @@ -8625,19 +8661,19 @@ Correctly initialized the library. Building a matrix with 7 nnz, 6 x 6 Duplicates check: 1 - 0 = 1 - converted COO to RSB in 1.929e-03 s (100.00 %) - analyzed arrays in 1.472e-03 s (76.31 %) - cleaned-up arrays in 4.053e-06 s (0.21 %) - deduplicated arrays in 9.537e-07 s (0.05 %) - sorted arrays in 9.537e-07 s (0.05 %) - shuffled partitions in 4.330e-04 s (22.44 %) - memory allocations took 7.868e-06 s (0.41 %) + converted COO to RSB in 1.892e-03 s (100.00 %) + analyzed arrays in 1.448e-03 s (76.55 %) + cleaned-up arrays in 3.099e-06 s (0.16 %) + deduplicated arrays in 0.000e+00 s (0.00 %) + sorted arrays in 1.907e-06 s (0.10 %) + shuffled partitions in 4.230e-04 s (22.36 %) + memory allocations took 7.868e-06 s (0.42 %) leafs setup took 2.146e-06 s (0.11 %) - halfword conversion took 5.960e-06 s (0.31 %) -Built (6 x 6)[0xaaab0d8024d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' + halfword conversion took 4.768e-06 s (0.25 %) +Built (6 x 6)[0xaaab0d5044d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0xaaab0d8024d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0xaaab0d5044d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -8663,55 +8699,55 @@ 1 1 Will autotune matrix: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:2.965e-08 -3 iterations (12 th.) took 1.407e-05s; avg 4.689e-06s ( +/- 99.37/200.00 %); best 2.965e-08s; worst 1.407e-05s; std dev. 6.631e-06 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 2.965e-08 Mflops: 67.460) +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:2.935e-08 +3 iterations (12 th.) took 1.407e-05s; avg 4.689e-06s ( +/- 99.37/179.66 %); best 2.935e-08s; worst 1.311e-05s; std dev. 5.969e-06 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 2.935e-08 Mflops: 68.145) Merge (1 -> 1 leaves) took w.c.t. of 0s, ~0s of computing time (of which 0s sorting, 0s analysis) -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.67/200.00 %); best 2.965e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -After merge step 1: tpop: 2.965e-08 s ~Mflops: 67.460 nsubm:1 otn:12 -Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 2.965e-08s -> 2.965e-08s, so IGNORING this instance. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +After merge step 1: tpop: 2.935e-08 s ~Mflops: 68.145 nsubm:1 otn:12 +Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 2.935e-08s -> 2.935e-08s, so IGNORING this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (1 -> 1 subms) took 8.106e-06s (of which 2.146e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) -Total merge + benchmarking process took 8.106e-06s, equivalent to 273.4/273.4 new/old ops (0.001289s for 1 clones -- as 43474.1/43474.1 ops, or 43474.1/43474.1 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +A total of 1 merge steps (of max 6) (1 -> 1 subms) took 7.868e-06s (of which 1.907e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 7.868e-06s, equivalent to 268.1/268.1 new/old ops (0.001314s for 1 clones -- as 44776.6/44776.6 ops, or 44776.6/44776.6 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.67/200.00 %); best 2.965e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 2.965e-08 Mflops: 67.460) -Split (1 -> 1 leaves, 1 -> 1 subms) took 1.407e-05s (of which: 2.146e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.67/200.00 %); best 2.965e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -After split step 1: tpop: 2.965e-08 s ~Mflops: 67.460 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 2.965e-08s -> 2.965e-08s, so IGNORING this instance. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 2.935e-08 Mflops: 68.145) +Split (1 -> 1 leaves, 1 -> 1 subms) took 1.097e-05s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +After split step 1: tpop: 2.935e-08 s ~Mflops: 68.145 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 2.935e-08s -> 2.935e-08s, so IGNORING this instance. Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.34/ 50.00 %); best 2.965e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -After split step 2: tpop: 2.965e-08 s ~Mflops: 67.460 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00000x): 2.965e-08s -> 2.965e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 1.597e-05s (of which: 1.192e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.67/200.00 %); best 2.965e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -After split step 3: tpop: 2.965e-08 s ~Mflops: 67.460 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=1.00000x): 2.965e-08s -> 2.965e-08s, so IGNORING this instance. +3 iterations (12 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +After split step 2: tpop: 2.935e-08 s ~Mflops: 68.145 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00000x): 2.935e-08s -> 2.935e-08s, so IGNORING this instance. Split (1 -> 1 leaves, 1 -> 1 subms) took 1.192e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 2.965e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -After split step 4: tpop: 2.965e-08 s ~Mflops: 67.460 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00000x): 2.965e-08s -> 2.965e-08s, so IGNORING this instance. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +After split step 3: tpop: 2.935e-08 s ~Mflops: 68.145 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=1.00000x): 2.935e-08s -> 2.935e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 2.935e-08s; worst 0s; std dev. 0 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +After split step 4: tpop: 2.935e-08 s ~Mflops: 68.145 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00000x): 2.935e-08s -> 2.935e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +After split step 5: tpop: 2.935e-08 s ~Mflops: 68.145 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00000x): 2.935e-08s -> 2.935e-08s, so IGNORING this instance. Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 2.965e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -After split step 5: tpop: 2.965e-08 s ~Mflops: 67.460 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00000x): 2.965e-08s -> 2.965e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 1.907e-06s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.67/200.00 %); best 2.965e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.96474e-08 s (67.46 Mflops) with 12 threads. -After split step 6: tpop: 2.965e-08 s ~Mflops: 67.460 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00000x): 2.965e-08s -> 2.965e-08s, so IGNORING this instance. -A total of 6 split steps (of max 6) (1 -> 1 subms) took 0.000458s (of which 0.0004261s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 1.502e-05s analyzing) -Total split + benchmarking process took 0.000458s, equivalent to 15448.3/15448.3 new/old ops (0.001281s for 1 clones -- as 43208.7/43208.7 ops, or 43208.7/43208.7 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.0031s, 0.0026s for constructor, 2 clones) obtained NO speedup (best stays 67.46 Mflops). +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 2.93493e-08 s (68.14 Mflops) with 12 threads. +After split step 6: tpop: 2.935e-08 s ~Mflops: 68.145 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00000x): 2.935e-08s -> 2.935e-08s, so IGNORING this instance. +A total of 6 split steps (of max 6) (1 -> 1 subms) took 6.509e-05s (of which 3.791e-05s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 1.907e-06s analyzing) +Total split + benchmarking process took 6.509e-05s, equivalent to 2217.7/2217.7 new/old ops (0.001474s for 1 clones -- as 50219.3/50219.3 ops, or 50219.3/50219.3 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.0029s, 0.0028s for constructor, 2 clones) obtained NO speedup (best stays 68.14 Mflops). Backsolving we should get a unitary vector: %%MatrixMarket matrix array real general @@ -8746,119 +8782,190 @@ /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran Building a matrix with 210 nnz, 20 x 20 Duplicates check: 210 - 0 = 210 - converted COO to RSB in 3.716e-03 s (100.00 %) - analyzed arrays in 1.105e-03 s (29.73 %) - cleaned-up arrays in 9.537e-07 s (0.03 %) - deduplicated arrays in 2.146e-06 s (0.06 %) - sorted arrays in 8.750e-04 s (23.55 %) - shuffled partitions in 8.459e-04 s (22.76 %) - memory allocations took 2.193e-05 s (0.59 %) - leafs setup took 4.053e-06 s (0.11 %) - halfword conversion took 8.490e-04 s (22.85 %) -Built (20 x 20)[0xaaab10cac9f0]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'LS' + converted COO to RSB in 3.649e-03 s (100.00 %) + analyzed arrays in 8.810e-04 s (24.14 %) + cleaned-up arrays in 1.192e-06 s (0.03 %) + deduplicated arrays in 9.537e-07 s (0.03 %) + sorted arrays in 9.830e-04 s (26.94 %) + shuffled partitions in 8.540e-04 s (23.40 %) + memory allocations took 1.979e-05 s (0.54 %) + leafs setup took 3.099e-06 s (0.08 %) + halfword conversion took 8.969e-04 s (24.58 %) +Built (20 x 20)[0xaaaaf81b09f0]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'LS' Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:2.999e-08 -Starting autotuning (16 x 2.99931e-08 s stages, transA=N, nrhs=1, timer gran.=2.99931e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.002898s; avg 0.000966s ( +/- 34.89/ 27.13 %); best 0.0006289s; worst 0.001228s; std dev. 0.0002503 (taking best). -Reference operation time is 0.000628948 s (1.336 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.0006289 Mflops: 1.336) -Merge (22 -> 16 leaves) took w.c.t. of 0.0004649s, ~0.0001051s of computing time (of which 2.146e-06s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 0.003095s; avg 0.001032s ( +/- 34.27/ 56.04 %); best 0.0006781s; worst 0.00161s; std dev. 0.0004122 (taking best). -Reference operation time is 0.000678062 s (1.239 Mflops) with 12 threads. -After merge step 1: tpop: 0.0006781 s ~Mflops: 1.239 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.078x: 0.0006289s -> 0.0006781s. -Merge (16 -> 10 leaves) took w.c.t. of 0.000242s, ~8.821e-06s of computing time (of which 1.907e-06s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 0.002431s; avg 0.0008103s ( +/- 63.99/ 34.29 %); best 0.0002918s; worst 0.001088s; std dev. 0.0003669 (taking best). -Reference operation time is 0.000291824 s (2.878 Mflops) with 12 threads. -After merge step 2: tpop: 0.0002918 s ~Mflops: 2.878 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 2.155x: 0.0006289s -> 0.0002918s, so taking this instance. -Merge (10 -> 8 leaves) took w.c.t. of 1.097e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 0.003221s; avg 0.001074s ( +/- 35.56/ 57.88 %); best 0.0006919s; worst 0.001695s; std dev. 0.0004433 (taking best). -Reference operation time is 0.000691891 s (1.214 Mflops) with 12 threads. -After merge step 3: tpop: 0.0006919 s ~Mflops: 1.214 nsubm:8 otn:12 -Applying merge (10 -> 8 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 2.371x: 0.0002918s -> 0.0006919s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 3 merge steps (of max 6) (22 -> 8 subms) took 0.01167s (of which 0.000726s partitioning, 0s I/O); computing times: 0.000119s in par. loops, 5.007e-06s sorting, 8.821e-06s analyzing) -Total merge + benchmarking process took 0.01167s, equivalent to 40.0/18.6 new/old ops (0.003468s for 2 clones -- as 11.9/5.5 ops, or 5.9/2.8 ops per clone), SPEEDUP of 2.155x -Applying multi-merge (22 -> 10 leaves, 2 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 2.155x (0.0006289s -> 0.0002918s), will amortize in 34.6 ops by saving 0.0003371s per op. -In 1 tuning rounds (tot. 0.016s, 0.0035s for constructor, 2 clones) obtained a SPEEDUP of 115.5% (2.155x) (from 1.336 to 2.878 Mflops). +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:2.935e-08 +Starting autotuning (16 x 2.93493e-08 s stages, transA=N, nrhs=1, timer gran.=2.93493e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.003623s; avg 0.001208s ( +/- 49.40/ 73.47 %); best 0.0006111s; worst 0.002095s; std dev. 0.0006397 (taking best). +Reference operation time is 0.000611067 s (1.375 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.0006111 Mflops: 1.375) +Merge (22 -> 16 leaves) took w.c.t. of 0.0003009s, ~0.0001049s of computing time (of which 2.146e-06s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 0.008533s; avg 0.002844s ( +/- 84.57/156.02 %); best 0.0004389s; worst 0.007282s; std dev. 0.003142 (taking best). +Reference operation time is 0.000438929 s (1.914 Mflops) with 12 threads. +After merge step 1: tpop: 0.0004389 s ~Mflops: 1.914 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.392x: 0.0006111s -> 0.0004389s, so taking this instance. +Merge (16 -> 10 leaves) took w.c.t. of 3.004e-05s, ~8.106e-06s of computing time (of which 2.146e-06s sorting, 2.861e-06s analysis) +3 iterations (12 th.) took 0.00199s; avg 0.0006634s ( +/- 36.06/ 69.89 %); best 0.0004241s; worst 0.001127s; std dev. 0.0003279 (taking best). +Reference operation time is 0.000424147 s (1.98 Mflops) with 12 threads. +After merge step 2: tpop: 0.0004241 s ~Mflops: 1.980 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.035x: 0.0004389s -> 0.0004241s, so taking this instance. +Merge (10 -> 8 leaves) took w.c.t. of 7.153e-06s, ~2.861e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 0.001274s; avg 0.0004246s ( +/- 1.57/ 2.19 %); best 0.0004179s; worst 0.0004339s; std dev. 6.78e-06 (taking best). +Reference operation time is 0.000417948 s (2.01 Mflops) with 12 threads. +After merge step 3: tpop: 0.0004179 s ~Mflops: 2.010 nsubm:8 otn:12 +Applying merge (10 -> 8 leaves, 12 th.) yielded SPEEDUP of 1.015x: 0.0004241s -> 0.0004179s, so taking this instance. +Merge (8 -> 6 leaves) took w.c.t. of 5.96e-06s, ~2.146e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 0.001837s; avg 0.0006123s ( +/- 30.11/ 59.71 %); best 0.000428s; worst 0.000978s; std dev. 0.0002586 (taking best). +Reference operation time is 0.000427961 s (1.963 Mflops) with 12 threads. +After merge step 4: tpop: 0.000428 s ~Mflops: 1.963 nsubm:6 otn:12 +Applying merge (8 -> 6 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.024x: 0.0004179s -> 0.000428s. +Merge (6 -> 3 leaves) took w.c.t. of 5.96e-06s, ~2.861e-06s of computing time (of which 9.537e-07s sorting, 0s analysis) +3 iterations (12 th.) took 0.001307s; avg 0.0004357s ( +/- 1.55/ 1.46 %); best 0.0004289s; worst 0.000442s; std dev. 5.361e-06 (taking best). +Reference operation time is 0.000428915 s (1.958 Mflops) with 12 threads. +After merge step 5: tpop: 0.0004289 s ~Mflops: 1.958 nsubm:3 otn:12 +Applying merge (6 -> 3 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.026x: 0.0004179s -> 0.0004289s. +Merge (3 -> 1 leaves) took w.c.t. of 1.001e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 95.90/200.00 %); best 2.935e-08s; worst 2.146e-06s; std dev. 1.012e-06 (taking best). +Reference operation time is 2.93493e-08 s (2.862e+04 Mflops) with 12 threads. +After merge step 6: tpop: 2.935e-08 s ~Mflops: 28620.758 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 14240.455x: 0.0004179s -> 2.935e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 6 merge steps (of max 6) (22 -> 1 subms) took 0.02086s (of which 0.0006487s partitioning, 0s I/O); computing times: 0.0001259s in par. loops, 8.106e-06s sorting, 1.192e-05s analyzing) +Total merge + benchmarking process took 0.02086s, equivalent to 710641.8/34.1 new/old ops (0.006483s for 5 clones -- as 220893.6/10.6 ops, or 44178.7/2.1 ops per clone), SPEEDUP of 20820.471x +Applying multi-merge (22 -> 1 leaves, 6 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 20820.471x (0.0006111s -> 2.935e-08s), will amortize in 34.1 ops by saving 0.000611s per op. +In 1 tuning rounds (tot. 0.026s, 0.0065s for constructor, 5 clones) obtained a SPEEDUP of 2081947.1% (2.082e+04x) (from 1.375 to 2.862e+04 Mflops). autotuner chose 12 threads -Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:2.999e-08 -Starting autotuning (16 x 2.99931e-08 s stages, transA=N, nrhs=1, timer gran.=2.99931e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.001503s; avg 0.0005011s ( +/- 52.09/ 49.69 %); best 0.0002401s; worst 0.0007501s; std dev. 0.0002084 (taking best). -~ 12 threads: 0.0002401s (3.5 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.002171s; avg 0.0007237s ( +/- 35.62/ 63.90 %); best 0.0004659s; worst 0.001186s; std dev. 0.0003277 (taking best). - 11 threads: 0.0004659s (1.8 Mflops) (1/2 degradations so far) - -3 iterations (10 th.) took 0.001685s; avg 0.0005617s ( +/- 24.15/ 18.38 %); best 0.0004261s; worst 0.0006649s; std dev. 0.0001002 (taking best). - 10 threads: 0.0004261s (2 Mflops) (2/2 degradations so far) - -Best threads choice is 12; starting threads were 12; max speed gap is 1.9x; search took 0.0054s. -Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz (tpop: 0.0002401 Mflops: 3.499) -Merge (10 -> 8 leaves) took w.c.t. of 1.001e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 0.002661s; avg 0.000887s ( +/- 33.58/ 30.66 %); best 0.0005891s; worst 0.001159s; std dev. 0.0002333 (taking best). -~ 12 threads: 0.0005891s (1.4 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.002955s; avg 0.000985s ( +/- 65.10/121.94 %); best 0.0003438s; worst 0.002186s; std dev. 0.0008499 (taking best). - 11 threads: 0.0003438s (2.4 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.001285s; avg 0.0004283s ( +/- 3.36/ 2.71 %); best 0.0004139s; worst 0.0004399s; std dev. 1.079e-05 (taking best). - 10 threads: 0.0004139s (2 Mflops) (1/2 degradations so far) - -3 iterations (9 th.) took 0.001761s; avg 0.000587s ( +/- 29.49/ 48.05 %); best 0.0004139s; worst 0.000869s; std dev. 0.0002012 (taking best). - 9 threads: 0.0004139s (2 Mflops) (2/2 degradations so far) - -Best threads choice is 11; starting threads were 12; max speed gap is 1.7x; search took 0.0087s. -After merge step 1: tpop: 0.0003438 s ~Mflops: 2.443 nsubm:8 otn:11 -Applying merge (10 -> 8 leaves, 11 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.432x: 0.0002401s -> 0.0003438s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (10 -> 8 subms) took 0.008695s (of which 1.192e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.008695s, equivalent to 36.2/36.2 new/old ops (0.001587s for 1 clones -- as 6.6/6.6 ops, or 6.6/6.6 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz. +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:2.935e-08 +Starting autotuning (16 x 2.93493e-08 s stages, transA=N, nrhs=1, timer gran.=2.93493e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.38/200.00 %); best 2.935e-08s; worst 1.907e-06s; std dev. 8.991e-07 (taking best). +~ 12 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 11 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 10 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 9 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 8 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 7 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 6 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.38/ 50.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 5 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 4 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 3 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 2 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.38/ 50.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 1 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 4.6e-05s. +Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz (tpop: 2.935e-08 Mflops: 28620.758) +Merge (1 -> 1 leaves) took w.c.t. of 0s, ~0s of computing time (of which 0s sorting, 0s analysis) +3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 95.90/ 66.67 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). +~ 12 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 11 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.38/ 50.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 10 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 9 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 8 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 7 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 6 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 5 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 4 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.38/ 50.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 3 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 2 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 1 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 5.6e-05s. +After merge step 1: tpop: 2.935e-08 s ~Mflops: 28620.758 nsubm:1 otn:12 +Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 2.935e-08s -> 2.935e-08s, so IGNORING this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 1 merge steps (of max 6) (1 -> 1 subms) took 5.913e-05s (of which 9.537e-07s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 5.913e-05s, equivalent to 2014.6/2014.6 new/old ops (0.001092s for 1 clones -- as 37213.6/37213.6 ops, or 37213.6/37213.6 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.002978s; avg 0.0009927s ( +/- 31.38/ 50.40 %); best 0.0006812s; worst 0.001493s; std dev. 0.0003573 (taking best). -~ 12 threads: 0.0006812s (1.2 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.004147s; avg 0.001382s ( +/- 57.60/ 65.08 %); best 0.000586s; worst 0.002282s; std dev. 0.0006962 (taking best). - 11 threads: 0.000586s (1.4 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.002305s; avg 0.0007683s ( +/- 68.50/ 80.66 %); best 0.000242s; worst 0.001388s; std dev. 0.0004725 (taking best). - 10 threads: 0.000242s (3.5 Mflops) (0/2 degradations so far) - -3 iterations (9 th.) took 0.005657s; avg 0.001886s ( +/- 82.29/159.11 %); best 0.000334s; worst 0.004886s; std dev. 0.002122 (taking best). - 9 threads: 0.000334s (2.5 Mflops) (1/2 degradations so far) - -3 iterations (8 th.) took 0.001807s; avg 0.0006023s ( +/- 27.60/ 13.88 %); best 0.0004361s; worst 0.0006859s; std dev. 0.0001176 (taking best). - 8 threads: 0.0004361s (1.9 Mflops) (2/2 degradations so far) - -Best threads choice is 10; starting threads were 12; max speed gap is 2.8x; search took 0.017s. -Starting split (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz (tpop: 0.000242 Mflops: 3.471) -Split (10 -> 25 leaves, 14 -> 34 subms) took 0.000458s (of which: 3.099e-06s analysis, -8.98e+09s mem.mgmt); compute time: 0.0008991s overall, 5.722e-06s searches, 0.0008934s shuffle, 0.0007794s switch, 4.101e-05s quadrants. -3 iterations (12 th.) took 0.004514s; avg 0.001505s ( +/- 70.83/ 40.29 %); best 0.0004389s; worst 0.002111s; std dev. 0.000756 (taking best). -~ 12 threads: 0.0004389s (1.9 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.02064s; avg 0.006882s ( +/- 89.86/127.33 %); best 0.0006981s; worst 0.01564s; std dev. 0.006368 (taking best). - 11 threads: 0.0006981s (1.2 Mflops) (1/2 degradations so far) - -3 iterations (10 th.) took 0.006828s; avg 0.002276s ( +/- 70.17/ 75.08 %); best 0.000679s; worst 0.003985s; std dev. 0.001352 (taking best). - 10 threads: 0.000679s (1.2 Mflops) (2/2 degradations so far) - -Best threads choice is 12; starting threads were 12; max speed gap is 1.6x; search took 0.032s. -After split step 1: tpop: 0.0004389 s ~Mflops: 1.914 nsubm:25 otn:12 -Applying split (10 -> 25 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.814x: 0.000242s -> 0.0004389s. +3 iterations (12 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.38/ 50.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +~ 12 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 11 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.38/ 50.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 10 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 9 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 8 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 7 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 6 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 95.38/ 50.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 5 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 95.90/ 66.67 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). + 4 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 3 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 2 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.61/200.00 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 1 threads: 2.935e-08s (2.9e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 6.7e-05s. +Starting split (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz (tpop: 2.935e-08 Mflops: 28620.758) +Split (1 -> 3 leaves, 1 -> 4 subms) took 1.907e-05s (of which: 9.537e-07s analysis, -1.762e+09s mem.mgmt); compute time: 7.868e-06s overall, 9.537e-07s searches, 6.914e-06s shuffle, 1.907e-06s switch, 1.192e-06s quadrants. +3 iterations (12 th.) took 0.00192s; avg 0.00064s ( +/- 33.43/ 51.25 %); best 0.0004261s; worst 0.000968s; std dev. 0.0002355 (taking best). +~ 12 threads: 0.0004261s (2 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 0.002064s; avg 0.000688s ( +/- 37.93/ 47.38 %); best 0.000427s; worst 0.001014s; std dev. 0.000244 (taking best). + 11 threads: 0.000427s (2 Mflops) (1/2 degradations so far) - +3 iterations (10 th.) took 0.001821s; avg 0.000607s ( +/- 30.48/ 60.45 %); best 0.000422s; worst 0.0009739s; std dev. 0.0002595 (taking best). + 10 threads: 0.000422s (2 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 0.001292s; avg 0.0004307s ( +/- 6.22/ 8.45 %); best 0.0004039s; worst 0.0004671s; std dev. 2.667e-05 (taking best). + 9 threads: 0.0004039s (2.1 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 0.001187s; avg 0.0003957s ( +/- 14.32/ 8.46 %); best 0.000339s; worst 0.0004292s; std dev. 4.029e-05 (taking best). + 8 threads: 0.000339s (2.5 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.001274s; avg 0.0004247s ( +/- 1.09/ 1.50 %); best 0.0004201s; worst 0.0004311s; std dev. 4.645e-06 (taking best). + 7 threads: 0.0004201s (2 Mflops) (1/2 degradations so far) - +3 iterations (6 th.) took 0.0018s; avg 0.0006s ( +/- 29.83/ 56.79 %); best 0.000421s; worst 0.0009408s; std dev. 0.0002411 (taking best). + 6 threads: 0.000421s (2 Mflops) (2/2 degradations so far) - +Best threads choice is 8; starting threads were 12; max speed gap is 1.3x; search took 0.011s. +After split step 1: tpop: 0.000339 s ~Mflops: 2.478 nsubm:3 otn:8 +Applying split (1 -> 3 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 11551.584x: 2.935e-08s -> 0.000339s. Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 split steps (of max 6) (10 -> 25 subms) took 0.03252s (of which 0.0004969s partitioning, 0s I/O); computing times: 0.0008991s in par. loops, 5.722e-06s sorting, 3.099e-06s analyzing) -Total split + benchmarking process took 0.03252s, equivalent to 134.4/134.4 new/old ops (0.001314s for 1 clones -- as 5.4/5.4 ops, or 5.4/5.4 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.066s, 0.0029s for constructor, 2 clones) obtained NO speedup (best stays 3.471 Mflops). +A total of 1 split steps (of max 6) (1 -> 3 subms) took 0.01143s (of which 2.48e-05s partitioning, 0s I/O); computing times: 7.868e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) +Total split + benchmarking process took 0.01143s, equivalent to 389374.5/389374.5 new/old ops (0.001381s for 1 clones -- as 47051.2/47051.2 ops, or 47051.2/47051.2 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.014s, 0.0025s for constructor, 2 clones) obtained NO speedup (best stays 2.862e+04 Mflops). check results are ok Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 2.185e-03 s (100.00 %) - analyzed arrays in 8.712e-04 s (39.87 %) - cleaned-up arrays in 9.537e-07 s (0.04 %) - deduplicated arrays in 0.000e+00 s (0.00 %) - sorted arrays in 8.829e-04 s (40.40 %) - shuffled partitions in 4.199e-04 s (19.21 %) - memory allocations took 7.153e-06 s (0.33 %) - leafs setup took 1.192e-06 s (0.05 %) - halfword conversion took 9.537e-07 s (0.04 %) -Built (6 x 6)[0xaaab10cb60c0]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' + converted COO to RSB in 1.325e-03 s (100.00 %) + analyzed arrays in 6.461e-04 s (48.76 %) + cleaned-up arrays in 1.192e-06 s (0.09 %) + deduplicated arrays in 9.537e-07 s (0.07 %) + sorted arrays in 2.549e-04 s (19.23 %) + shuffled partitions in 4.170e-04 s (31.47 %) + memory allocations took 4.053e-06 s (0.31 %) + leafs setup took 0.000e+00 s (0.00 %) + halfword conversion took 9.537e-07 s (0.07 %) +Built (6 x 6)[0xaaaaf81bb990]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' Read matrix pd.mtx 6 x 6 : 36 Matrix has no symmetry Using NRHS=4 -Repeated USMV took 0.1881E-03 s -A single USMM took 0.9918E-04 s -USMM-to-USMV speed ratio is is 1.897 x +Repeated USMV took 0.1831E-03 s +A single USMM took 0.9179E-04 s +USMM-to-USMV speed ratio is is 1.995 x Call auto-tuning routine.. Repeat measurement. -Tuned USMM took 0.2146E-05 s -Tuned-to-untuned speed ratio is is 46.22 x +Tuned USMM took 0.9537E-06 s +Tuned-to-untuned speed ratio is is 96.25 x FAILED: 0 PASSED: 2 /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran_rsb_fi @@ -8907,218 +9014,238 @@ Loading matrix from file "/build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx". Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 4.632e-03 s (100.00 %) - analyzed arrays in 1.247e-03 s (26.92 %) - cleaned-up arrays in 2.146e-06 s (0.05 %) + converted COO to RSB in 4.537e-03 s (100.00 %) + analyzed arrays in 9.170e-04 s (20.21 %) + cleaned-up arrays in 9.537e-07 s (0.02 %) deduplicated arrays in 9.537e-07 s (0.02 %) - sorted arrays in 1.037e-03 s (22.39 %) - shuffled partitions in 8.640e-04 s (18.65 %) + sorted arrays in 1.064e-03 s (23.45 %) + shuffled partitions in 8.650e-04 s (19.06 %) memory allocations took 8.106e-06 s (0.18 %) - leafs setup took 4.053e-06 s (0.09 %) - halfword conversion took 1.459e-03 s (31.50 %) -Built (6 x 6)[0xaaaadc5f6a20]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + leafs setup took 3.099e-06 s (0.07 %) + halfword conversion took 1.669e-03 s (36.78 %) +Built (6 x 6)[0xaaab0e710a20]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Considering D clone. Base matrix: -(6 x 6)[0xaaaadc5faaa0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(6 x 6)[0xaaab0e714aa0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.001862s; avg 0.0006207s ( +/- 52.94/ 43.39 %); best 0.0002921s; worst 0.00089s; std dev. 0.0002477 (taking best). -Reference operation time is 0.000292063 s (0.493 Mflops) with 12 threads. -After 0.001895s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.002863s; avg 0.0009543s ( +/- 25.17/ 40.73 %); best 0.0007141s; worst 0.001343s; std dev. 0.0002774 (taking best). +Reference operation time is 0.000714064 s (0.2017 Mflops) with 12 threads. +After 0.002895s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.001484s; avg 0.0004946s ( +/- 8.03/ 9.80 %); best 0.0004549s; worst 0.0005431s; std dev. 3.654e-05 (taking best). -Reference operation time is 0.000454903 s (0.3166 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.0004549 Mflops: 0.317) -Merge (22 -> 16 leaves) took w.c.t. of 0.00033s, ~0.0001371s of computing time (of which 1.907e-06s sorting, 6.914e-06s analysis) -3 iterations (12 th.) took 0.004214s; avg 0.001405s ( +/- 44.84/ 65.17 %); best 0.0007749s; worst 0.00232s; std dev. 0.0006623 (taking best). -Reference operation time is 0.00077486 s (0.1858 Mflops) with 12 threads. -After merge step 1: tpop: 0.0007749 s ~Mflops: 0.186 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.703x: 0.0004549s -> 0.0007749s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (22 -> 16 subms) took 0.004564s (of which 0.000335s partitioning, 0s I/O); computing times: 0.0001371s in par. loops, 1.907e-06s sorting, 6.914e-06s analyzing) -Total merge + benchmarking process took 0.004564s, equivalent to 10.0/10.0 new/old ops (0.001268s for 1 clones -- as 2.8/2.8 ops, or 2.8/2.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.002114s; avg 0.0007046s ( +/- 60.85/ 47.46 %); best 0.0002759s; worst 0.001039s; std dev. 0.0003186 (taking best). -Reference operation time is 0.00027585 s (0.522 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.0002759 Mflops: 0.522) -Split (22 -> 28 leaves, 29 -> 37 subms) took 0.000936s (of which: 3.099e-06s analysis, -3.592e+09s mem.mgmt); compute time: 0.0001101s overall, 9.537e-07s searches, 0.0001092s shuffle, 5.317e-05s switch, 2.146e-06s quadrants. -3 iterations (12 th.) took 0.002413s; avg 0.0008043s ( +/- 38.20/ 73.55 %); best 0.0004971s; worst 0.001396s; std dev. 0.0004184 (taking best). -Reference operation time is 0.000497103 s (0.2897 Mflops) with 12 threads. -After split step 1: tpop: 0.0004971 s ~Mflops: 0.290 nsubm:28 otn:12 -Applying split (22 -> 28 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.802x: 0.0002759s -> 0.0004971s. -Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 split steps (of max 6) (22 -> 28 subms) took 0.003412s (of which 0.000977s partitioning, 0s I/O); computing times: 0.0001101s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) -Total split + benchmarking process took 0.003412s, equivalent to 12.4/12.4 new/old ops (0.001103s for 1 clones -- as 4.0/4.0 ops, or 4.0/4.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.014s, 0.0024s for constructor, 2 clones) obtained NO speedup (best stays 0.522 Mflops). -After 0.014013s, global autotuning found old matrix optimal, with declared speedup 1 x when using 12 threads +3 iterations (12 th.) took 0.00269s; avg 0.0008967s ( +/- 10.77/ 19.22 %); best 0.0008001s; worst 0.001069s; std dev. 0.0001222 (taking best). +Reference operation time is 0.000800133 s (0.18 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.0008001 Mflops: 0.180) +Merge (22 -> 16 leaves) took w.c.t. of 0.0004158s, ~0.000227s of computing time (of which 1.907e-06s sorting, 2.861e-06s analysis) +3 iterations (12 th.) took 0.002664s; avg 0.000888s ( +/- 49.12/ 78.15 %); best 0.0004518s; worst 0.001582s; std dev. 0.0004961 (taking best). +Reference operation time is 0.000451803 s (0.3187 Mflops) with 12 threads. +After merge step 1: tpop: 0.0004518 s ~Mflops: 0.319 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.771x: 0.0008001s -> 0.0004518s, so taking this instance. +Merge (16 -> 10 leaves) took w.c.t. of 0.000304s, ~1.407e-05s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 0.001795s; avg 0.0005984s ( +/- 24.13/ 46.39 %); best 0.0004539s; worst 0.0008759s; std dev. 0.0001963 (taking best). +Reference operation time is 0.000453949 s (0.3172 Mflops) with 12 threads. +After merge step 2: tpop: 0.0004539 s ~Mflops: 0.317 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99527x): 0.0004518s -> 0.0004539s, so IGNORING this instance. +Merge (10 -> 7 leaves) took w.c.t. of 5.96e-06s, ~3.099e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.001543s; avg 0.0005143s ( +/- 16.61/ 29.88 %); best 0.0004289s; worst 0.000668s; std dev. 0.0001089 (taking best). +Reference operation time is 0.000428915 s (0.3357 Mflops) with 12 threads. +After merge step 3: tpop: 0.0004289 s ~Mflops: 0.336 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded SPEEDUP of 1.053x: 0.0004518s -> 0.0004289s, so taking this instance. +Merge (7 -> 4 leaves) took w.c.t. of 7.868e-06s, ~2.146e-06s of computing time (of which 1.192e-06s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.001526s; avg 0.0005086s ( +/- 32.73/ 41.14 %); best 0.0003421s; worst 0.0007179s; std dev. 0.0001563 (taking best). +Reference operation time is 0.000342131 s (0.4209 Mflops) with 12 threads. +After merge step 4: tpop: 0.0003421 s ~Mflops: 0.421 nsubm:4 otn:12 +Applying merge (7 -> 4 leaves, 12 th.) yielded SPEEDUP of 1.254x: 0.0004289s -> 0.0003421s, so taking this instance. +Merge (4 -> 1 leaves) took w.c.t. of 5.007e-06s, ~2.146e-06s of computing time (of which 0s sorting, 0s analysis) +3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 95.90/ 66.67 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). +Reference operation time is 2.93493e-08 s (4906 Mflops) with 12 threads. +After merge step 5: tpop: 2.935e-08 s ~Mflops: 4906.416 nsubm:1 otn:12 +Applying merge (4 -> 1 leaves, 12 th.) yielded SPEEDUP of 11657.189x: 0.0003421s -> 2.935e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 5 merge steps (of max 6) (22 -> 1 subms) took 0.0143s (of which 0.0007501s partitioning, 0s I/O); computing times: 0.0002484s in par. loops, 4.053e-06s sorting, 8.821e-06s analyzing) +Total merge + benchmarking process took 0.0143s, equivalent to 487132.4/17.9 new/old ops (0.007766s for 5 clones -- as 264622.3/9.7 ops, or 52924.5/1.9 ops per clone), SPEEDUP of 27262.388x +Applying multi-merge (22 -> 1 leaves, 5 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 27262.388x (0.0008001s -> 2.935e-08s), will amortize in 17.9 ops by saving 0.0008001s per op. +In 1 tuning rounds (tot. 0.019s, 0.0078s for constructor, 5 clones) obtained a SPEEDUP of 2726138.8% (2.726e+04x) (from 0.18 to 4906 Mflops). +After 0.018825s, global autotuning declared speedup of 27262.4 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaab0e716e70]{D} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' Considering S clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 5.313e-03 s (100.00 %) - analyzed arrays in 1.569e-03 s (29.53 %) - cleaned-up arrays in 9.537e-07 s (0.02 %) + converted COO to RSB in 2.776e-03 s (100.00 %) + analyzed arrays in 9.248e-04 s (33.32 %) + cleaned-up arrays in 9.537e-07 s (0.03 %) deduplicated arrays in 0.000e+00 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.251e-03 s (23.55 %) - memory allocations took 1.907e-06 s (0.04 %) - leafs setup took 1.192e-06 s (0.02 %) - halfword conversion took 2.489e-03 s (46.85 %) -Built (6 x 6)[0xaaaadc5fce90]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + shuffled partitions in 9.072e-04 s (32.68 %) + memory allocations took 2.861e-06 s (0.10 %) + leafs setup took 9.537e-07 s (0.03 %) + halfword conversion took 9.379e-04 s (33.79 %) +Built (6 x 6)[0xaaab0e716e70]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Base matrix: -(6 x 6)[0xaaaadc5fce90]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(6 x 6)[0xaaab0e716e70]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' -Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz. +Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.01015s; avg 0.003382s ( +/- 87.05/164.90 %); best 0.000438s; worst 0.008958s; std dev. 0.003945 (taking best). -Reference operation time is 0.000437975 s (0.3288 Mflops) with 12 threads. -After 0.010165s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.003258s; avg 0.001086s ( +/- 45.31/ 64.74 %); best 0.0005939s; worst 0.001789s; std dev. 0.0005102 (taking best). +Reference operation time is 0.000593901 s (0.2425 Mflops) with 12 threads. +After 0.003268s, autotuning routine did not find a better threads count configuration. -Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz. +Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.001617s; avg 0.000539s ( +/- 20.78/ 39.34 %); best 0.000427s; worst 0.000751s; std dev. 0.00015 (taking best). -Reference operation time is 0.000427008 s (0.3372 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz (tpop: 0.000427 Mflops: 0.337) -Merge (16 -> 13 leaves) took w.c.t. of 8.821e-06s, ~3.099e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) -3 iterations (12 th.) took 0.001526s; avg 0.0005086s ( +/- 15.86/ 22.48 %); best 0.000428s; worst 0.000623s; std dev. 8.311e-05 (taking best). -Reference operation time is 0.000427961 s (0.3365 Mflops) with 12 threads. -After merge step 1: tpop: 0.000428 s ~Mflops: 0.336 nsubm:13 otn:12 -Applying merge (16 -> 13 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99777x): 0.000427s -> 0.000428s, so IGNORING this instance. -Merge (13 -> 10 leaves) took w.c.t. of 0.0002098s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 0.000206s analysis) -3 iterations (12 th.) took 0.002049s; avg 0.000683s ( +/- 33.26/ 27.97 %); best 0.0004559s; worst 0.000874s; std dev. 0.0001726 (taking best). -Reference operation time is 0.000455856 s (0.3159 Mflops) with 12 threads. -After merge step 2: tpop: 0.0004559 s ~Mflops: 0.316 nsubm:10 otn:12 -Applying merge (13 -> 10 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.068x: 0.000427s -> 0.0004559s. -Merge (10 -> 7 leaves) took w.c.t. of 5.007e-06s, ~1.192e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 0.003219s; avg 0.001073s ( +/- 58.36/116.03 %); best 0.0004468s; worst 0.002318s; std dev. 0.0008804 (taking best). -Reference operation time is 0.000446796 s (0.3223 Mflops) with 12 threads. -After merge step 3: tpop: 0.0004468 s ~Mflops: 0.322 nsubm:7 otn:12 -Applying merge (10 -> 7 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.046x: 0.000427s -> 0.0004468s. -Merge (7 -> 4 leaves) took w.c.t. of 5.96e-06s, ~2.146e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) -3 iterations (12 th.) took 0.002324s; avg 0.0007747s ( +/- 17.77/ 34.77 %); best 0.0006371s; worst 0.001044s; std dev. 0.0001905 (taking best). -Reference operation time is 0.000637054 s (0.226 Mflops) with 12 threads. -After merge step 4: tpop: 0.0006371 s ~Mflops: 0.226 nsubm:4 otn:12 -Applying merge (7 -> 4 leaves, 12 th.) yielded SLOWDOWN (3th of 3 tolerable) of 1.492x: 0.000427s -> 0.0006371s. -Skipping further merge based tests after 3 definite performance degradations in a row (and last exceeding limit). -A total of 4 merge steps (of max 6) (16 -> 4 subms) took 0.009389s (of which 0.0002367s partitioning, 0s I/O); computing times: 8.345e-06s in par. loops, 9.537e-07s sorting, 0.0002108s analyzing) -Total merge + benchmarking process took 0.009389s, equivalent to 22.0/22.0 new/old ops (0.001579s for 1 clones -- as 3.7/3.7 ops, or 3.7/3.7 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.002483s; avg 0.0008276s ( +/- 46.85/ 45.10 %); best 0.0004399s; worst 0.001201s; std dev. 0.0003109 (taking best). -Reference operation time is 0.000439882 s (0.3274 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz (tpop: 0.0004399 Mflops: 0.327) -Split (16 -> 25 leaves, 21 -> 33 subms) took 0.000864s (of which: 3.099e-06s analysis, -5.388e+09s mem.mgmt); compute time: 0.0003171s overall, 0s searches, 0.0003171s shuffle, 0.00021s switch, 4.053e-06s quadrants. -3 iterations (12 th.) took 0.003753s; avg 0.001251s ( +/- 25.82/ 14.88 %); best 0.0009279s; worst 0.001437s; std dev. 0.0002293 (taking best). -Reference operation time is 0.000927925 s (0.1552 Mflops) with 12 threads. -After split step 1: tpop: 0.0009279 s ~Mflops: 0.155 nsubm:25 otn:12 -Applying split (16 -> 25 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 2.109x: 0.0004399s -> 0.0009279s. -Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 split steps (of max 6) (16 -> 25 subms) took 0.004637s (of which 0.000874s partitioning, 0s I/O); computing times: 0.0003171s in par. loops, 0s sorting, 3.099e-06s analyzing) -Total split + benchmarking process took 0.004637s, equivalent to 10.5/10.5 new/old ops (0.001738s for 1 clones -- as 4.0/4.0 ops, or 4.0/4.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.022s, 0.0033s for constructor, 2 clones) obtained NO speedup (best stays 0.3274 Mflops). -After 0.021511s, global autotuning found old matrix optimal, with declared speedup 1 x when using 12 threads +3 iterations (12 th.) took 0.002081s; avg 0.0006936s ( +/- 10.91/ 9.13 %); best 0.000618s; worst 0.000757s; std dev. 5.741e-05 (taking best). +Reference operation time is 0.000617981 s (0.233 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.000618 Mflops: 0.233) +Merge (16 -> 10 leaves) took w.c.t. of 0.0002649s, ~8.821e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.001774s; avg 0.0005914s ( +/- 26.26/ 49.13 %); best 0.0004361s; worst 0.0008819s; std dev. 0.0002056 (taking best). +Reference operation time is 0.000436068 s (0.3302 Mflops) with 12 threads. +After merge step 1: tpop: 0.0004361 s ~Mflops: 0.330 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.417x: 0.000618s -> 0.0004361s, so taking this instance. +Merge (10 -> 7 leaves) took w.c.t. of 6.914e-06s, ~3.099e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.002324s; avg 0.0007747s ( +/- 42.70/ 84.47 %); best 0.0004439s; worst 0.001429s; std dev. 0.0004627 (taking best). +Reference operation time is 0.000443935 s (0.3244 Mflops) with 12 threads. +After merge step 2: tpop: 0.0004439 s ~Mflops: 0.324 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.98228x): 0.0004361s -> 0.0004439s, so IGNORING this instance. +Merge (7 -> 4 leaves) took w.c.t. of 7.868e-06s, ~3.815e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.001686s; avg 0.000562s ( +/- 2.50/ 2.67 %); best 0.0005479s; worst 0.000577s; std dev. 1.189e-05 (taking best). +Reference operation time is 0.000547886 s (0.2628 Mflops) with 12 threads. +After merge step 3: tpop: 0.0005479 s ~Mflops: 0.263 nsubm:4 otn:12 +Applying merge (7 -> 4 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.256x: 0.0004361s -> 0.0005479s. +Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 3 merge steps (of max 6) (16 -> 4 subms) took 0.007366s (of which 0.0003009s partitioning, 0s I/O); computing times: 1.574e-05s in par. loops, 0s sorting, 5.722e-06s analyzing) +Total merge + benchmarking process took 0.007366s, equivalent to 16.9/11.9 new/old ops (0.002645s for 2 clones -- as 6.1/4.3 ops, or 3.0/2.1 ops per clone), SPEEDUP of 1.417x +Applying multi-merge (16 -> 10 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.417x (0.000618s -> 0.0004361s), will amortize in 40.5 ops by saving 0.0001819s per op. +In 1 tuning rounds (tot. 0.011s, 0.0026s for constructor, 2 clones) obtained a SPEEDUP of 41.7% (1.417x) (from 0.233 to 0.3302 Mflops). +After 0.010875s, global autotuning declared speedup of 1.41717 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaab0e714aa0]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 10, symflags:'' Considering C clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 4.132e-03 s (100.00 %) - analyzed arrays in 1.708e-03 s (41.34 %) - cleaned-up arrays in 9.537e-07 s (0.02 %) - deduplicated arrays in 0.000e+00 s (0.00 %) + converted COO to RSB in 3.512e-03 s (100.00 %) + analyzed arrays in 1.321e-03 s (37.61 %) + cleaned-up arrays in 0.000e+00 s (0.00 %) + deduplicated arrays in 9.537e-07 s (0.03 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.313e-03 s (31.78 %) - memory allocations took 2.861e-06 s (0.07 %) + shuffled partitions in 1.095e-03 s (31.18 %) + memory allocations took 2.146e-06 s (0.06 %) leafs setup took 1.907e-06 s (0.05 %) - halfword conversion took 1.105e-03 s (26.74 %) -Built (6 x 6)[0xaaaadc5ff670]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + halfword conversion took 1.090e-03 s (31.04 %) +Built (6 x 6)[0xaaab0e71aab0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Base matrix: -(6 x 6)[0xaaaadc5ff670]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(6 x 6)[0xaaab0e71aab0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003467s; avg 0.001156s ( +/- 33.53/ 17.50 %); best 0.0007682s; worst 0.001358s; std dev. 0.000274 (taking best). -Reference operation time is 0.000768185 s (0.7498 Mflops) with 12 threads. -After 0.003512s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.006161s; avg 0.002054s ( +/- 74.19/144.79 %); best 0.00053s; worst 0.005027s; std dev. 0.002103 (taking best). +Reference operation time is 0.000530005 s (1.087 Mflops) with 12 threads. +After 0.006173s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.002159s; avg 0.0007196s ( +/- 34.40/ 66.88 %); best 0.0004721s; worst 0.001201s; std dev. 0.0003404 (taking best). -Reference operation time is 0.000472069 s (1.22 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.0004721 Mflops: 1.220) -Merge (22 -> 16 leaves) took w.c.t. of 4.792e-05s, ~8.106e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) -3 iterations (12 th.) took 0.005311s; avg 0.00177s ( +/- 23.63/ 43.52 %); best 0.001352s; worst 0.002541s; std dev. 0.0005455 (taking best). -Reference operation time is 0.00135207 s (0.426 Mflops) with 12 threads. -After merge step 1: tpop: 0.001352 s ~Mflops: 0.426 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 2.864x: 0.0004721s -> 0.001352s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (22 -> 16 subms) took 0.005378s (of which 5.078e-05s partitioning, 0s I/O); computing times: 8.106e-06s in par. loops, 9.537e-07s sorting, 1.907e-06s analyzing) -Total merge + benchmarking process took 0.005378s, equivalent to 11.4/11.4 new/old ops (0.0013s for 1 clones -- as 2.8/2.8 ops, or 2.8/2.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.001613s; avg 0.0005376s ( +/- 10.91/ 21.29 %); best 0.000479s; worst 0.0006521s; std dev. 8.093e-05 (taking best). -Reference operation time is 0.000478983 s (1.203 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.000479 Mflops: 1.203) -Split (22 -> 28 leaves, 29 -> 37 subms) took 0.000453s (of which: 3.099e-06s analysis, -3.592e+09s mem.mgmt); compute time: 2.003e-05s overall, 1.192e-06s searches, 1.884e-05s shuffle, 8.106e-06s switch, 1.907e-06s quadrants. -3 iterations (12 th.) took 0.002491s; avg 0.0008303s ( +/- 15.55/ 9.23 %); best 0.0007012s; worst 0.0009069s; std dev. 9.185e-05 (taking best). -Reference operation time is 0.000701189 s (0.8215 Mflops) with 12 threads. -After split step 1: tpop: 0.0007012 s ~Mflops: 0.821 nsubm:28 otn:12 -Applying split (22 -> 28 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.464x: 0.000479s -> 0.0007012s. -Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 split steps (of max 6) (22 -> 28 subms) took 0.002978s (of which 0.0004742s partitioning, 0s I/O); computing times: 2.003e-05s in par. loops, 1.192e-06s sorting, 3.099e-06s analyzing) -Total split + benchmarking process took 0.002978s, equivalent to 6.2/6.2 new/old ops (0.001802s for 1 clones -- as 3.8/3.8 ops, or 3.8/3.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.015s, 0.0031s for constructor, 2 clones) obtained NO speedup (best stays 1.203 Mflops). -After 0.015288s, global autotuning found old matrix optimal, with declared speedup 1 x when using 12 threads +3 iterations (12 th.) took 0.002922s; avg 0.000974s ( +/- 43.53/ 74.11 %); best 0.00055s; worst 0.001696s; std dev. 0.000513 (taking best). +Reference operation time is 0.000550032 s (1.047 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.00055 Mflops: 1.047) +Merge (22 -> 16 leaves) took w.c.t. of 0.0006411s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.004031s; avg 0.001344s ( +/- 65.77/118.73 %); best 0.0004599s; worst 0.002939s; std dev. 0.00113 (taking best). +Reference operation time is 0.000459909 s (1.252 Mflops) with 12 threads. +After merge step 1: tpop: 0.0004599 s ~Mflops: 1.252 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.196x: 0.00055s -> 0.0004599s, so taking this instance. +Merge (16 -> 10 leaves) took w.c.t. of 0.0002429s, ~7.153e-06s of computing time (of which 0s sorting, 3.099e-06s analysis) +3 iterations (12 th.) took 0.001516s; avg 0.0005053s ( +/- 15.68/ 16.36 %); best 0.0004261s; worst 0.0005879s; std dev. 6.613e-05 (taking best). +Reference operation time is 0.000426054 s (1.352 Mflops) with 12 threads. +After merge step 2: tpop: 0.0004261 s ~Mflops: 1.352 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.079x: 0.0004599s -> 0.0004261s, so taking this instance. +Merge (10 -> 7 leaves) took w.c.t. of 6.914e-06s, ~2.861e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.001282s; avg 0.0004273s ( +/- 2.64/ 1.82 %); best 0.000416s; worst 0.0004351s; std dev. 8.17e-06 (taking best). +Reference operation time is 0.00041604 s (1.384 Mflops) with 12 threads. +After merge step 3: tpop: 0.000416 s ~Mflops: 1.384 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded SPEEDUP of 1.024x: 0.0004261s -> 0.000416s, so taking this instance. +Merge (7 -> 4 leaves) took w.c.t. of 4.053e-06s, ~1.192e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 0.001273s; avg 0.0004244s ( +/- 1.29/ 2.08 %); best 0.0004189s; worst 0.0004332s; std dev. 6.299e-06 (taking best). +Reference operation time is 0.000418901 s (1.375 Mflops) with 12 threads. +After merge step 4: tpop: 0.0004189 s ~Mflops: 1.375 nsubm:4 otn:12 +Applying merge (7 -> 4 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99317x): 0.000416s -> 0.0004189s, so IGNORING this instance. +Merge (4 -> 1 leaves) took w.c.t. of 2.861e-06s, ~1.907e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.77/200.00 %); best 2.935e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 2.93493e-08 s (1.963e+04 Mflops) with 12 threads. +After merge step 5: tpop: 2.935e-08 s ~Mflops: 19625.663 nsubm:1 otn:12 +Applying merge (4 -> 1 leaves, 12 th.) yielded SPEEDUP of 14175.467x: 0.000416s -> 2.935e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 5 merge steps (of max 6) (22 -> 1 subms) took 0.01415s (of which 0.0009151s partitioning, 0s I/O); computing times: 1.812e-05s in par. loops, 9.537e-07s sorting, 8.821e-06s analyzing) +Total merge + benchmarking process took 0.01415s, equivalent to 482120.2/25.7 new/old ops (0.006355s for 5 clones -- as 216531.3/11.6 ops, or 43306.3/2.3 ops per clone), SPEEDUP of 18740.861x +Applying multi-merge (22 -> 1 leaves, 5 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 18740.861x (0.00055s -> 2.935e-08s), will amortize in 25.7 ops by saving 0.00055s per op. +In 1 tuning rounds (tot. 0.018s, 0.0064s for constructor, 5 clones) obtained a SPEEDUP of 1873986.1% (1.874e+04x) (from 1.047 to 1.963e+04 Mflops). +After 0.018364s, global autotuning declared speedup of 18740.9 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaab0e719a80]{C} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' Considering Z clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 3.937e-03 s (100.00 %) - analyzed arrays in 2.371e-03 s (60.23 %) - cleaned-up arrays in 1.192e-06 s (0.03 %) - deduplicated arrays in 9.537e-07 s (0.02 %) + converted COO to RSB in 2.738e-03 s (100.00 %) + analyzed arrays in 1.038e-03 s (37.90 %) + cleaned-up arrays in 0.000e+00 s (0.00 %) + deduplicated arrays in 9.537e-07 s (0.03 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 7.000e-04 s (17.78 %) - memory allocations took 3.815e-06 s (0.10 %) - leafs setup took 1.907e-06 s (0.05 %) - halfword conversion took 8.562e-04 s (21.75 %) -Built (6 x 6)[0xaaaadc5ff670]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' + shuffled partitions in 8.531e-04 s (31.16 %) + memory allocations took 1.907e-06 s (0.07 %) + leafs setup took 9.537e-07 s (0.03 %) + halfword conversion took 8.421e-04 s (30.76 %) +Built (6 x 6)[0xaaab0e719a80]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' Base matrix: -(6 x 6)[0xaaaadc5ff670]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' +(6 x 6)[0xaaab0e719a80]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.002406s; avg 0.000802s ( +/- 38.67/ 37.91 %); best 0.0004919s; worst 0.001106s; std dev. 0.0002508 (taking best). -Reference operation time is 0.000491858 s (1.171 Mflops) with 12 threads. -After 0.002427s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.002122s; avg 0.0007074s ( +/- 28.04/ 39.53 %); best 0.000509s; worst 0.0009871s; std dev. 0.0002034 (taking best). +Reference operation time is 0.000509024 s (1.132 Mflops) with 12 threads. +After 0.002133s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003186s; avg 0.001062s ( +/- 16.78/ 32.68 %); best 0.0008838s; worst 0.001409s; std dev. 0.0002454 (taking best). -Reference operation time is 0.000883818 s (0.6517 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz (tpop: 0.0008838 Mflops: 0.652) -Merge (28 -> 22 leaves) took w.c.t. of 0.0004048s, ~1.407e-05s of computing time (of which 2.384e-06s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 0.002666s; avg 0.0008887s ( +/- 31.35/ 56.52 %); best 0.0006101s; worst 0.001391s; std dev. 0.0003559 (taking best). -Reference operation time is 0.000610113 s (0.9441 Mflops) with 12 threads. -After merge step 1: tpop: 0.0006101 s ~Mflops: 0.944 nsubm:22 otn:12 -Applying merge (28 -> 22 leaves, 12 th.) yielded SPEEDUP of 1.449x: 0.0008838s -> 0.0006101s, so taking this instance. -Merge (22 -> 16 leaves) took w.c.t. of 1.907e-05s, ~9.775e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 0.002383s; avg 0.0007943s ( +/- 38.32/ 44.91 %); best 0.00049s; worst 0.001151s; std dev. 0.0002724 (taking best). -Reference operation time is 0.00048995 s (1.176 Mflops) with 12 threads. -After merge step 2: tpop: 0.00049 s ~Mflops: 1.176 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.245x: 0.0006101s -> 0.00049s, so taking this instance. -Merge (16 -> 10 leaves) took w.c.t. of 0.0002382s, ~6.676e-06s of computing time (of which 1.907e-06s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 0.003337s; avg 0.001112s ( +/- 24.02/ 18.20 %); best 0.0008452s; worst 0.001315s; std dev. 0.0001971 (taking best). -Reference operation time is 0.000845194 s (0.6815 Mflops) with 12 threads. -After merge step 3: tpop: 0.0008452 s ~Mflops: 0.682 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.725x: 0.00049s -> 0.0008452s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 3 merge steps (of max 6) (28 -> 10 subms) took 0.01213s (of which 0.000669s partitioning, 0s I/O); computing times: 3.052e-05s in par. loops, 5.245e-06s sorting, 8.106e-06s analyzing) -Total merge + benchmarking process took 0.01213s, equivalent to 24.8/13.7 new/old ops (0.005199s for 3 clones -- as 10.6/5.9 ops, or 3.5/2.0 ops per clone), SPEEDUP of 1.804x -Applying multi-merge (28 -> 16 leaves, 2 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.804x (0.0008838s -> 0.00049s), will amortize in 30.8 ops by saving 0.0003939s per op. -In 1 tuning rounds (tot. 0.018s, 0.0052s for constructor, 3 clones) obtained a SPEEDUP of 80.4% (1.804x) (from 0.6517 to 1.176 Mflops). -After 0.017515s, global autotuning declared speedup of 1.80389 x, when using threads count of 12 and a new matrix: -(6 x 6)[0xaaaadc605520]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +3 iterations (12 th.) took 0.00485s; avg 0.001617s ( +/- 38.58/ 70.72 %); best 0.000993s; worst 0.00276s; std dev. 0.0008095 (taking best). +Reference operation time is 0.000993013 s (0.5801 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz (tpop: 0.000993 Mflops: 0.580) +Merge (28 -> 22 leaves) took w.c.t. of 0.00049s, ~6.199e-06s of computing time (of which 1.192e-06s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.002427s; avg 0.000809s ( +/- 28.94/ 41.06 %); best 0.0005748s; worst 0.001141s; std dev. 0.0002413 (taking best). +Reference operation time is 0.000574827 s (1.002 Mflops) with 12 threads. +After merge step 1: tpop: 0.0005748 s ~Mflops: 1.002 nsubm:22 otn:12 +Applying merge (28 -> 22 leaves, 12 th.) yielded SPEEDUP of 1.727x: 0.000993s -> 0.0005748s, so taking this instance. +Merge (22 -> 16 leaves) took w.c.t. of 0.000283s, ~6.199e-06s of computing time (of which 0s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 0.002267s; avg 0.0007556s ( +/- 10.96/ 14.76 %); best 0.0006728s; worst 0.0008671s; std dev. 8.188e-05 (taking best). +Reference operation time is 0.000672817 s (0.8561 Mflops) with 12 threads. +After merge step 2: tpop: 0.0006728 s ~Mflops: 0.856 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.170x: 0.0005748s -> 0.0006728s. +Merge (16 -> 10 leaves) took w.c.t. of 0.000242s, ~6.914e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 0.00185s; avg 0.0006166s ( +/- 27.50/ 22.92 %); best 0.000447s; worst 0.0007579s; std dev. 0.0001285 (taking best). +Reference operation time is 0.000447035 s (1.288 Mflops) with 12 threads. +After merge step 3: tpop: 0.000447 s ~Mflops: 1.288 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.286x: 0.0005748s -> 0.000447s, so taking this instance. +Merge (10 -> 7 leaves) took w.c.t. of 7.153e-06s, ~3.099e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 0.001439s; avg 0.0004797s ( +/- 11.18/ 21.92 %); best 0.0004261s; worst 0.0005848s; std dev. 7.435e-05 (taking best). +Reference operation time is 0.000426054 s (1.352 Mflops) with 12 threads. +After merge step 4: tpop: 0.0004261 s ~Mflops: 1.352 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded SPEEDUP of 1.049x: 0.000447s -> 0.0004261s, so taking this instance. +Merge (7 -> 4 leaves) took w.c.t. of 4.053e-06s, ~2.146e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 0.00129s; avg 0.00043s ( +/- 1.15/ 1.63 %); best 0.0004251s; worst 0.000437s; std dev. 5.081e-06 (taking best). +Reference operation time is 0.0004251 s (1.355 Mflops) with 12 threads. +After merge step 5: tpop: 0.0004251 s ~Mflops: 1.355 nsubm:4 otn:12 +Applying merge (7 -> 4 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00224x): 0.0004261s -> 0.0004251s, so IGNORING this instance. +Merge (4 -> 1 leaves) took w.c.t. of 5.007e-06s, ~3.099e-06s of computing time (of which 0s sorting, 0s analysis) +3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 95.90/ 66.67 %); best 2.935e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). +Reference operation time is 2.93493e-08 s (1.963e+04 Mflops) with 12 threads. +After merge step 6: tpop: 2.935e-08 s ~Mflops: 19625.663 nsubm:1 otn:12 +Applying merge (4 -> 1 leaves, 12 th.) yielded SPEEDUP of 14516.653x: 0.0004261s -> 2.935e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 6 merge steps (of max 6) (28 -> 1 subms) took 0.01585s (of which 0.001043s partitioning, 0s I/O); computing times: 2.766e-05s in par. loops, 2.146e-06s sorting, 8.106e-06s analyzing) +Total merge + benchmarking process took 0.01585s, equivalent to 540040.6/16.0 new/old ops (0.006785s for 5 clones -- as 231186.0/6.8 ops, or 46237.2/1.4 ops per clone), SPEEDUP of 33834.281x +Applying multi-merge (28 -> 1 leaves, 6 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 33834.281x (0.000993s -> 2.935e-08s), will amortize in 16.0 ops by saving 0.000993s per op. +In 1 tuning rounds (tot. 0.022s, 0.0068s for constructor, 5 clones) obtained a SPEEDUP of 3383328.1% (3.383e+04x) (from 0.5801 to 1.963e+04 Mflops). +After 0.022067s, global autotuning declared speedup of 33834.3 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaab0e71d1d0]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -9249,19 +9376,18 @@ 4 0 DIFF PRINT TEST END Beginning large binary search test. -Detected 33596850176 bytes of memory, comprehensive of 23224246272 of free memory. +Detected 33596854272 bytes of memory, comprehensive of 18953117696 of free memory. On this system, maximal array of coordinates can have 2147483137 elements and occupy 8589932548 bytes. -Will perform the test using less memory (227 MB) than on the maximal coordinate indices array (238315520) allows. -(c)allocated 59578880 nnz (238315520 bytes) -Succeeded retrieving array last element. -Successfully performed large binary search test. +Will perform the test using less memory (17592186041588 MB) than on the maximal coordinate indices array (18446744070744520704) allows. +Skipping test: too little memory. +Skipping large binary search test. BASIC SPARSE BLAS TEST: BEGIN INIT INTERFACE TEST: BEGIN got RSB_IO_WANT_EXTRA_VERBOSE_INTERFACE: -1 got RSB_IO_WANT_IS_INITIALIZED_MARKER: 1 INIT INTERFACE TEST: END (SUCCESS) DEVEL PRINT TEST: BEGIN -(4 x 4)[0xaaaac32b13a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(4 x 4)[0xaaaacd4603a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -9270,8 +9396,8 @@ RSB_FLAG_ASSEMBLED_IN_COO_ARRAYS | RSB_FLAG_OWN_PARTITIONING_ARRAYS | RSB_FLAG_SORT_INPUT -(2 x 2)[0xaaaac32b14b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0xaaaac32b15c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaaacd4604b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaaacd4605c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' #R 4 x 4, 4 nnz (16 bytes), 16 index space for bytes, 544 bytes for 2 structs (2 of which are on the diagonal) (1e+02% of nnz are on the diagonal) #N at 0 0, 4 x 4, 4 nnz ( 25%) #T at 0 0, 2 x 2, 2 nnz ( 50%) @@ -9279,9 +9405,9 @@ ( 0x2046186 = { rec:1 coo:1 css:1 hw:1 ic:1 fi:0 symflags: } ) DEVEL PRINT TEST: END PRINT TEST: BEGIN [QUIET] -(2 x 2)[0xaaaac32b14b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0xaaaac32b15c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(4 x 4)[0xaaaac32b13a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(2 x 2)[0xaaaacd4604b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaaacd4605c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(4 x 4)[0xaaaacd4603a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -9299,8 +9425,8 @@ BASIC PRIMITIVES TEST: BEGIN BASIC PRIMITIVES TEST: END (SUCCESS) ADVANCED SPARSE BLAS TEST: BEGIN [limit 30.000000s] [QUIET] -Terminating testing earlier due to user timeout request: test took 30.009697 s, max allowed was 30.000000. - PASSED:20628 +Terminating testing earlier due to user timeout request: test took 30.000135 s, max allowed was 30.000000. + PASSED:19505 FAILED:0 ADVANCED SPARSE BLAS TEST: END (SUCCESS) gmake qtests -C librsbpp @@ -9309,7 +9435,7 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' ./rsbtt -if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh +if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh ++ ./rsbpp Td,s G.mtx ++ grep Z-sort ++ wc -l @@ -9385,10 +9511,10 @@ ++ grep Recursing ++ wc -l + test 4 = 4 +++ grep Recursing ++ OMP_NUM_THREADS=2 ++ RSB_NUM_THREADS=2 ++ ./rsbpp vvvC1000m100M100I1r1vtN,TorsF -++ grep Recursing ++ wc -l + test 4 = 4 ++ OMP_NUM_THREADS=1 @@ -9448,7 +9574,7 @@ 0 0 0 0 before tuning for SPMV: -(3 x 3)[0xaaab0283b0a0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' +(3 x 3)[0xaaaacd1f00a0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' ** x: 1.1 @@ -9537,18 +9663,18 @@ BEGIN Rsb_Matrix_test_multimatrix_ms_mnrhs BEGIN -(3 x 3)[0xaaab02852480]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaacd207480]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaab02852480]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaab02866a70]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaacd207480]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaacd21ba70]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaab02866a70]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaab02852480]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaacd21ba70]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaacd207480]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaab02852480]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaab02866a70]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaacd207480]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaacd21ba70]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaab02866a70]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaacd21ba70]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' END OK: terminating with no allocations registered in librsb [*] tests terminated successfully ! @@ -9565,10 +9691,10 @@ ./rsbtest --no-tune --max_t 0.01 --serial | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q Building ./rsbtest --no-tune --max_t 0.01 --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --no-trans --alpha 1 --type d --rand --serial . | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q adding ! ./rsbtest --mkl A.mkl -running on codethink03-arm64 +running on i-capture-the-hostname Built without the MKL. ( ! ./rsbtest --unrecognized-option-triggers-abort ) -running on codethink03-arm64 +running on i-capture-the-hostname /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest/.libs/rsbtest: unrecognized option '--unrecognized-option-triggers-abort' unrecognized option, aborting. ( ./rsbtest --no-tune --max_t 0.01 --skip-loading-hermitian-matrices --skip-loading-unsymmetric-matrices --tune-maxt 10 --tune-maxr 10 --verbose-tuning --extra-verbose-interface --min_t 0.01 --max_t 0.01 --mintimes 1 --maxtimes 1 --verbose --skip-loading-symmetric-matrices A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q skip ) @@ -9577,7 +9703,7 @@ ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --types all --nthreads 1,2 --maxtimes 1 -+ A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q 2.threads ) ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --render-only A.mtx > /dev/null ) ! ./rsbtest --no-tune --max_t 0.01 --quiet --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --render --no-trans --alpha 1 --type all A.mtx -running on codethink03-arm64 +running on i-capture-the-hostname Will not invoke autotuning routine. Benchmark will sample for at most 0.01 s Built without render support! @@ -9629,7 +9755,7 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' - /bin/bash ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' + /bin/sh ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' libtool: install: /usr/bin/install -c .libs/librsb.so.0.0.0 /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu/librsb.so.0.0.0 libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu && { ln -s -f librsb.so.0.0.0 librsb.so.0 || { rm -f librsb.so.0 && ln -s librsb.so.0.0.0 librsb.so.0; }; }) libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu && { ln -s -f librsb.so.0.0.0 librsb.so || { rm -f librsb.so && ln -s librsb.so.0.0.0 librsb.so; }; }) @@ -9639,7 +9765,7 @@ libtool: install: ranlib /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu/librsb.a libtool: warning: remember to run 'libtool --finish /usr/lib/aarch64-linux-gnu' /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' - /bin/bash ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' + /bin/sh ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' libtool: warning: 'librsb.la' has not been installed in '/usr/lib/aarch64-linux-gnu' libtool: install: /usr/bin/install -c .libs/rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin/rsbench /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' @@ -9774,11 +9900,11 @@ dh_gencontrol dh_md5sums dh_builddeb -dpkg-deb: building package 'librsb0t64-dbgsym' in '../librsb0t64-dbgsym_1.3.0.2+dfsg-8_arm64.deb'. dpkg-deb: building package 'librsb0t64' in '../librsb0t64_1.3.0.2+dfsg-8_arm64.deb'. -dpkg-deb: building package 'librsb-dev' in '../librsb-dev_1.3.0.2+dfsg-8_arm64.deb'. -dpkg-deb: building package 'librsb-tools-dbgsym' in '../librsb-tools-dbgsym_1.3.0.2+dfsg-8_arm64.deb'. dpkg-deb: building package 'librsb-tools' in '../librsb-tools_1.3.0.2+dfsg-8_arm64.deb'. +dpkg-deb: building package 'librsb0t64-dbgsym' in '../librsb0t64-dbgsym_1.3.0.2+dfsg-8_arm64.deb'. +dpkg-deb: building package 'librsb-tools-dbgsym' in '../librsb-tools-dbgsym_1.3.0.2+dfsg-8_arm64.deb'. +dpkg-deb: building package 'librsb-dev' in '../librsb-dev_1.3.0.2+dfsg-8_arm64.deb'. dpkg-deb: building package 'librsb-doc' in '../librsb-doc_1.3.0.2+dfsg-8_all.deb'. dpkg-genbuildinfo --build=binary -O../librsb_1.3.0.2+dfsg-8_arm64.buildinfo dpkg-genchanges --build=binary -O../librsb_1.3.0.2+dfsg-8_arm64.changes @@ -9788,12 +9914,14 @@ dpkg-buildpackage: info: binary-only upload (no source included) dpkg-genchanges: info: not including original source code in upload I: copying local configuration +I: user script /srv/workspace/pbuilder/3598769/tmp/hooks/B01_cleanup starting +I: user script /srv/workspace/pbuilder/3598769/tmp/hooks/B01_cleanup finished I: unmounting dev/ptmx filesystem I: unmounting dev/pts filesystem I: unmounting dev/shm filesystem I: unmounting proc filesystem I: unmounting sys filesystem I: cleaning the build env -I: removing directory /srv/workspace/pbuilder/3017132 and its subdirectories -I: Current time: Mon Nov 30 06:42:05 -12 2026 -I: pbuilder-time-stamp: 1796064125 +I: removing directory /srv/workspace/pbuilder/3598769 and its subdirectories +I: Current time: Wed Oct 29 02:30:41 +14 2025 +I: pbuilder-time-stamp: 1761654641