Diff of the two buildlogs: -- --- b1/build.log 2025-08-04 01:27:39.723710547 +0000 +++ b2/build.log 2025-08-04 01:40:00.108694151 +0000 @@ -1,6 +1,6 @@ I: pbuilder: network access will be disabled during build -I: Current time: Sat Sep 5 19:38:44 -12 2026 -I: pbuilder-time-stamp: 1788680324 +I: Current time: Mon Aug 4 15:27:42 +14 2025 +I: pbuilder-time-stamp: 1754270862 I: Building the build Environment I: extracting base tarball [/var/cache/pbuilder/trixie-reproducible-base.tgz] I: copying local configuration @@ -25,52 +25,84 @@ dpkg-source: info: applying auto-gitignore I: Not using root during the build. I: Installing the build-deps -I: user script /srv/workspace/pbuilder/1467199/tmp/hooks/D02_print_environment starting +I: user script /srv/workspace/pbuilder/1730324/tmp/hooks/D01_modify_environment starting +debug: Running on codethink04-arm64. +I: Changing host+domainname to test build reproducibility +I: Adding a custom variable just for the fun of it... +I: Changing /bin/sh to bash +'/bin/sh' -> '/bin/bash' +lrwxrwxrwx 1 root root 9 Aug 4 01:27 /bin/sh -> /bin/bash +I: Setting pbuilder2's login shell to /bin/bash +I: Setting pbuilder2's GECOS to second user,second room,second work-phone,second home-phone,second other +I: user script /srv/workspace/pbuilder/1730324/tmp/hooks/D01_modify_environment finished +I: user script /srv/workspace/pbuilder/1730324/tmp/hooks/D02_print_environment starting I: set - BUILDDIR='/build/reproducible-path' - BUILDUSERGECOS='first user,first room,first work-phone,first home-phone,first other' - BUILDUSERNAME='pbuilder1' - BUILD_ARCH='arm64' - DEBIAN_FRONTEND='noninteractive' + BASH=/bin/sh + BASHOPTS=checkwinsize:cmdhist:complete_fullquote:extquote:force_fignore:globasciiranges:globskipdots:hostcomplete:interactive_comments:patsub_replacement:progcomp:promptvars:sourcepath + BASH_ALIASES=() + BASH_ARGC=() + BASH_ARGV=() + BASH_CMDS=() + BASH_LINENO=([0]="12" [1]="0") + BASH_LOADABLES_PATH=/usr/local/lib/bash:/usr/lib/bash:/opt/local/lib/bash:/usr/pkg/lib/bash:/opt/pkg/lib/bash:. + BASH_SOURCE=([0]="/tmp/hooks/D02_print_environment" [1]="/tmp/hooks/D02_print_environment") + BASH_VERSINFO=([0]="5" [1]="2" [2]="37" [3]="1" [4]="release" [5]="aarch64-unknown-linux-gnu") + BASH_VERSION='5.2.37(1)-release' + BUILDDIR=/build/reproducible-path + BUILDUSERGECOS='second user,second room,second work-phone,second home-phone,second other' + BUILDUSERNAME=pbuilder2 + BUILD_ARCH=arm64 + DEBIAN_FRONTEND=noninteractive DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=12 ' - DISTRIBUTION='trixie' - HOME='/root' - HOST_ARCH='arm64' + DIRSTACK=() + DISTRIBUTION=trixie + EUID=0 + FUNCNAME=([0]="Echo" [1]="main") + GROUPS=() + HOME=/root + HOSTNAME=i-capture-the-hostname + HOSTTYPE=aarch64 + HOST_ARCH=arm64 IFS=' ' - INVOCATION_ID='592f0c642cfc424d95670e364a3e708c' - LANG='C' - LANGUAGE='en_US:en' - LC_ALL='C' - MAIL='/var/mail/root' - OPTIND='1' - PATH='/usr/sbin:/usr/bin:/sbin:/bin:/usr/games' - PBCURRENTCOMMANDLINEOPERATION='build' - PBUILDER_OPERATION='build' - PBUILDER_PKGDATADIR='/usr/share/pbuilder' - PBUILDER_PKGLIBDIR='/usr/lib/pbuilder' - PBUILDER_SYSCONFDIR='/etc' - PPID='1467199' - PS1='# ' - PS2='> ' + INVOCATION_ID=a4c2e7b801a6456f82586cc5a2b3a645 + LANG=C + LANGUAGE=nl_BE:nl + LC_ALL=C + MACHTYPE=aarch64-unknown-linux-gnu + MAIL=/var/mail/root + OPTERR=1 + OPTIND=1 + OSTYPE=linux-gnu + PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path + PBCURRENTCOMMANDLINEOPERATION=build + PBUILDER_OPERATION=build + PBUILDER_PKGDATADIR=/usr/share/pbuilder + PBUILDER_PKGLIBDIR=/usr/lib/pbuilder + PBUILDER_SYSCONFDIR=/etc + PIPESTATUS=([0]="0") + POSIXLY_CORRECT=y + PPID=1730324 PS4='+ ' - PWD='/' - SHELL='/bin/bash' - SHLVL='2' - SUDO_COMMAND='/usr/bin/timeout -k 18.1h 18h /usr/bin/ionice -c 3 /usr/bin/nice /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.VwV7TEZu/pbuilderrc_OSUm --distribution trixie --hookdir /etc/pbuilder/first-build-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/trixie-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.VwV7TEZu/b1 --logfile b1/build.log librsb_1.3.0.2+dfsg-7.dsc' - SUDO_GID='109' - SUDO_UID='104' - SUDO_USER='jenkins' - TERM='unknown' - TZ='/usr/share/zoneinfo/Etc/GMT+12' - USER='root' - _='/usr/bin/systemd-run' - http_proxy='http://192.168.101.4:3128' + PWD=/ + SHELL=/bin/bash + SHELLOPTS=braceexpand:errexit:hashall:interactive-comments:posix + SHLVL=3 + SUDO_COMMAND='/usr/bin/timeout -k 24.1h 24h /usr/bin/ionice -c 3 /usr/bin/nice -n 11 /usr/bin/unshare --uts -- /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.VwV7TEZu/pbuilderrc_wL8J --distribution trixie --hookdir /etc/pbuilder/rebuild-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/trixie-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.VwV7TEZu/b2 --logfile b2/build.log librsb_1.3.0.2+dfsg-7.dsc' + SUDO_GID=109 + SUDO_UID=104 + SUDO_USER=jenkins + TERM=unknown + TZ=/usr/share/zoneinfo/Etc/GMT-14 + UID=0 + USER=root + _='I: set' + http_proxy=http://192.168.101.4:3128 I: uname -a - Linux codethink03-arm64 6.1.0-37-cloud-arm64 #1 SMP Debian 6.1.140-1 (2025-05-22) aarch64 GNU/Linux + Linux i-capture-the-hostname 6.1.0-37-cloud-arm64 #1 SMP Debian 6.1.140-1 (2025-05-22) aarch64 GNU/Linux I: ls -l /bin - lrwxrwxrwx 1 root root 7 May 12 2025 /bin -> usr/bin -I: user script /srv/workspace/pbuilder/1467199/tmp/hooks/D02_print_environment finished + lrwxrwxrwx 1 root root 7 May 12 19:25 /bin -> usr/bin +I: user script /srv/workspace/pbuilder/1730324/tmp/hooks/D02_print_environment finished -> Attempting to satisfy build-dependencies -> Creating pbuilder-satisfydepends-dummy package Package: pbuilder-satisfydepends-dummy @@ -296,7 +328,7 @@ Get: 178 http://deb.debian.org/debian trixie/main arm64 libltdl-dev arm64 2.5.4-4 [168 kB] Get: 179 http://deb.debian.org/debian trixie/main arm64 libhwloc-dev arm64 2.12.0-4 [239 kB] Get: 180 http://deb.debian.org/debian trixie/main arm64 zlib1g-dev arm64 1:1.3.dfsg+really1.3.1-1+b1 [917 kB] -Fetched 372 MB in 1s (309 MB/s) +Fetched 372 MB in 2s (164 MB/s) Preconfiguring packages ... Selecting previously unselected package libexpat1:arm64. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 19965 files and directories currently installed.) @@ -893,8 +925,8 @@ Setting up tzdata (2025b-4) ... Current default time zone: 'Etc/UTC' -Local time is now: Sun Sep 6 07:39:23 UTC 2026. -Universal Time is now: Sun Sep 6 07:39:23 UTC 2026. +Local time is now: Mon Aug 4 01:28:31 UTC 2025. +Universal Time is now: Mon Aug 4 01:28:31 UTC 2025. Run 'dpkg-reconfigure tzdata' if you wish to change it. Setting up libfontenc1:arm64 (1:1.1.8-1+b2) ... @@ -1062,7 +1094,11 @@ Building tag database... -> Finished parsing the build-deps I: Building the package -I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-7_source.changes +I: user script /srv/workspace/pbuilder/1730324/tmp/hooks/A99_set_merged_usr starting +Not re-configuring usrmerge for trixie +I: user script /srv/workspace/pbuilder/1730324/tmp/hooks/A99_set_merged_usr finished +hostname: Name or service not known +I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-7_source.changes dpkg-buildpackage: info: source package librsb dpkg-buildpackage: info: source version 1.3.0.2+dfsg-7 dpkg-buildpackage: info: source distribution unstable @@ -1082,62 +1118,62 @@ dh binary dh_update_autotools_config dh_autoreconf -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found libtoolize: putting auxiliary files in '.'. libtoolize: copying file './ltmain.sh' libtoolize: putting macros in AC_CONFIG_MACRO_DIRS, 'm4'. @@ -1179,90 +1215,90 @@ libtoolize: copying file 'm4/ltsugar.m4' libtoolize: copying file 'm4/ltversion.m4' libtoolize: copying file 'm4/lt~obsolete.m4' -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found configure.ac:66: installing './compile' configure.ac:65: installing './missing' Makefile.am: installing './depcomp' @@ -1448,7 +1484,7 @@ checking for m4... m4 checking for gmake... gmake checking for ggrep... /usr/bin/grep -checking for bash... /bin/bash +checking for bash... /bin/sh checking for gsed... /usr/bin/sed checking for cmp... cmp checking for basename... basename @@ -1565,7 +1601,7 @@ configure: It appears that Fortran programs can be linked without using the Fortran linker. configure: Using OPENMP_CFLAGS ok for linking an OpenMP program: adding it to LIBS. checking if your have a usable getrusage() ... 1 -checking for /bin/bash... /bin/bash +checking for /bin/sh... /bin/sh configure: Will not use Google Test. configure: You seem to not have GNU Octave or have disabled 'int' type. Part of the test suite will not be generated. If you want more testing capabilities, you should enable the 'int' type as well. checking that generated files are newer than configure... done @@ -1587,7 +1623,7 @@ config.status: executing depfiles commands config.status: executing libtool commands === configuring in librsbpp (/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1712,7 +1748,7 @@ configure: Will not use Google Test. checking whether you have std::thread... yes checking whether you have std::mutex... yes -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1721,7 +1757,7 @@ config.status: executing libtool commands configure: Successfully created a Makefile. === configuring in rsblib (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1833,7 +1869,7 @@ checking for filesystem... yes checking for main in -lstdc++fs... yes configure: Assuming you are yet to build librsb.la. (set LIBS= -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la) -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1843,7 +1879,7 @@ config.status: executing libtool commands configure: Created a Makefile. === configuring in rsbtest (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1957,7 +1993,7 @@ checking for filesystem... yes checking for rsb_lib_init... no checking for dd... yes -/bin/bash +/bin/sh /usr/bin/timeout checking that generated files are newer than configure... done configure: creating ./config.status @@ -1989,7 +2025,7 @@ ARFLAGS : cru M4 : m4 MAKE : gmake - BASH : /bin/bash + BASH : /bin/sh OCTAVE : false DOXYGEN : doxygen HELP2MAN : help2man @@ -2045,24 +2081,24 @@ Making all in librsbpp gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp.o rsbpp.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbtt.o rsbtt.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -c -o rsbct.o rsbct.c -libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -fPIC -DPIC -o .libs/rsbpp_coo.o libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -fPIC -DPIC -o .libs/rsbpp_csr.o +libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -fPIC -DPIC -o .libs/rsbpp_coo.o libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -o rsbpp_coo.o >/dev/null 2>&1 libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -o rsbpp_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs libtool: link: ar cr .libs/librsbpp.a .libs/rsbpp_coo.o .libs/rsbpp_csr.o libtool: link: ranlib .libs/librsbpp.a libtool: link: ( cd ".libs" && rm -f "librsbpp.la" && ln -s "../librsbpp.la" "librsbpp.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbct rsbct.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp -libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbpp rsbpp.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbtt rsbtt.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp +libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbpp rsbpp.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp gmake all-am gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' @@ -2080,94 +2116,99 @@ gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsbench-rsb_libspblas_tests.o `test -f 'rsb_libspblas_tests.c' || echo './'`rsb_libspblas_tests.c g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -c -o rsb_dummy.o rsb_dummy.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o ch2icfb-ch2icfb.o `test -f 'ch2icfb.c' || echo './'`ch2icfb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_stropts.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_stropts.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_vb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_vb.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -o librsb_nounroll_la-rsb_unroll.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_lb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_lb.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_stropts.c -o librsb_nounroll_la-rsb_stropts.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_lb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_lb.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_vb.c -o librsb_nounroll_la-rsb_krnl_vb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -o librsb_nounroll_la-rsb_unroll.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_lb.c -o librsb_nounroll_la-rsb_krnl_lb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -o librsb_nounroll_la-rsb_strmif.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mergesort.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_mergesort.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_l.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mergesort.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_mergesort.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_permute.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_permute.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_l.c -o librsb_nounroll_la-rsb_krnl_bcss_l.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mergesort.c -o librsb_nounroll_la-rsb_mergesort.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_l.c -o librsb_nounroll_la-rsb_krnl_bcss_l.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_u.c -o librsb_nounroll_la-rsb_krnl_bcss_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spmv.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spmv.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -o librsb_nounroll_la-rsb_bench.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spmv.c -o librsb_nounroll_la-rsb_spmv.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss.c -o librsb_nounroll_la-rsb_krnl_bcss.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spmv.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spmv.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_permute.c -o librsb_nounroll_la-rsb_permute.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_merge.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_merge.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spmv.c -o librsb_nounroll_la-rsb_spmv.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_ompio.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_ompio.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_util.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_ompio.c -o librsb_nounroll_la-rsb_ompio.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_merge.c -o librsb_nounroll_la-rsb_merge.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_ompio.c -o librsb_nounroll_la-rsb_ompio.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm_csr.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spgemm_csr.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_util.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spsum_misc.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm_csr.c -o librsb_nounroll_la-rsb_spgemm_csr.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_prec.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_prec.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spsum_misc.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -o librsb_nounroll_la-rsb_spsum_misc.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_is.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_is.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_prec.c -o librsb_nounroll_la-rsb_prec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_is.c -o librsb_base_la-rsb_is.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -o librsb_nounroll_la-rsb_spsum_misc.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mio.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_op.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_op.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_op.c -o librsb_base_la-rsb_op.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_bio.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mio.c -o librsb_base_la-rsb_mio.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bio.c -o librsb_base_la-rsb_bio.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_get.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_set.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_set.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mio.c -o librsb_base_la-rsb_mio.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_set.c -o librsb_base_la-rsb_set.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -o librsb_base_la-rsb_get.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -o librsb_base_la-rsb_coo.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c rsb_test_matops.c: In function 'rsb__main_block_partitioned_spmv_sxsa': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", | ^~ ~~~ +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 In file included from /usr/include/stdio.h:970, from rsb_common.h:49, from rsb_test_matops.h:79, @@ -2182,112 +2223,137 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -o librsb_base_la-rsb_coo.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -o librsb_base_la-rsb_get.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_check.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_check.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_idx.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_symm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_symm.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_check.c -o librsb_base_la-rsb_coo_check.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_idx.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_symm.c -o librsb_base_la-rsb_coo_symm.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srt.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srtp.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -o librsb_base_la-rsb_idx.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -o librsb_base_la-rsb_srt.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -o librsb_base_la-rsb_srtp.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_src.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_src.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -o librsb_base_la-rsb_srtp.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -o librsb_base_la-rsb_srt.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_src.c -o librsb_base_la-rsb_src.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_test_accuracy.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -o librsb_base_la-rsb_test_accuracy.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_clone.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_clone.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_test_accuracy.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_render.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_render.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -o librsb_base_la-rsb_test_accuracy.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -o librsb_base_la-rsb_clone.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_render.c -o librsb_base_la-rsb_render.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_eps.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_eps.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -o librsb_base_la-rsb_clone.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_msort_up.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_msort_up.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -o librsb_base_la-rsb_rec.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_msort_up.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_msort_up.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_sys.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_blas_stuff.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_msort_up.c -o librsb_base_la-rsb_msort_up.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_eps.c -o librsb_base_la-rsb_eps.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -o librsb_base_la-rsb_blas_stuff.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_blas_stuff.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_gen.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_gen.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -o librsb_base_la-rsb_sys.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_eps.c -o librsb_base_la-rsb_eps.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -o librsb_base_la-rsb_blas_stuff.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_perf.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -o librsb_base_la-rsb_perf.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rsb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rsb.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_gen.c -o librsb_base_la-rsb_gen.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_err.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_err.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -o librsb_base_la-rsb_perf.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rsb.c -o librsb_base_la-rsb_rsb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_err.c -o librsb_base_la-rsb_err.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_tune.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_do.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_internals.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_internals.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_do.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_garbage.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_garbage.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mmio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mmio.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -o librsb_base_la-rsb_do.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_partition.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mmio.c -o librsb_base_la-rsb_mmio.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mmio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mmio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_garbage.c -o librsb_base_la-rsb_garbage.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -o librsb_base_la-rsb_partition.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_internals.c -o librsb_base_la-rsb_internals.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mmio.c -o librsb_base_la-rsb_mmio.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -o librsb_base_la-rsb_do.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mbw.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_fpb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_fpb.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_limiter.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spgemm.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_internals.c -o librsb_base_la-rsb_internals.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_fpb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_fpb.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -o librsb_base_la-rsb_limiter.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spgemm.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_fpb.c -o librsb_base_la-rsb_fpb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm.c -o librsb_base_la-rsb_spgemm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsv.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsum.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_lock.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_swt.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsv.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm.c -o librsb_base_la-rsb_spgemm.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum.c -o librsb_base_la-rsb_spsum.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsv.c -o librsb_base_la-rsb_spsv.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -o librsb_base_la-rsb_lock.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_lock.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_swt.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_init.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -o librsb_base_la-rsb_lock.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_dump.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -o librsb_base_la-rsb_swt.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_cpmv.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -o librsb_base_la-rsb_init.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -o librsb_base_la-rsb_cpmv.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_asm.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_user.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo2rec.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2coo.o +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2csr.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -o librsb_nounroll_la-rsb_krnl.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -o librsb_base_la-rsb_rec2coo.o >/dev/null 2>&1 +libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -fPIC -o .libs/rsb_blas_sparse.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -o librsb_base_la-rsb_user.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -o librsb_base_la-rsb_csr2coo.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -o librsb_base_la-rsb_rec2csr.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c +gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.o rsb_blas_sparse.F90 +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 rsb_test_matops.c: In function 'rsb__main_block_partitioned_spsv_sxsx': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2302,56 +2368,26 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -o librsb_nounroll_la-rsb_krnl.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_dump.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_cpmv.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -o librsb_base_la-rsb_init.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -o librsb_base_la-rsb_cpmv.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_asm.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_user.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo2rec.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2csr.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2coo.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -o librsb_base_la-rsb_user.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -o librsb_base_la-rsb_rec2csr.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -o librsb_base_la-rsb_rec2coo.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -o librsb_base_la-rsb_csr2coo.o >/dev/null 2>&1 -libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -fPIC -o .libs/rsb_blas_sparse.o -gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.o rsb_blas_sparse.F90 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -fPIC -DPIC -o .libs/rsb_libspblas.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -fPIC -DPIC -o .libs/rsb_libspblas_handle.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -fPIC -DPIC -o .libs/rsb_libspblas.o libtool: warning: '-version-info' is ignored for programs libtool: link: gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -Wl,-z -Wl,relro -o ch2icfb ch2icfb-ch2icfb.o -fopenmp -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp if test -f ./rsb_types.h -a ! -f ./rsb_types.h ; then cp -pv ./rsb_types.h ./rsb_types.h ; fi # out-of-dir behaviour varies between installations -if test -f ch2icfb ; then if SED=/usr/bin/sed GREP=/usr/bin/grep /bin/bash ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.lo rsb.F90 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -o rsb_libspblas.o >/dev/null 2>&1 +if test -f ch2icfb ; then if SED=/usr/bin/sed GREP=/usr/bin/grep /bin/sh ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.lo rsb.F90 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -o rsb_blas_sparse.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -o rsb_libspblas_handle.o >/dev/null 2>&1 gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.o rsb.F90 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -o rsb_libspblas_handle.o >/dev/null 2>&1 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb.F90 -fPIC -o .libs/rsb.o libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb.F90 -o rsb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -libtool: warning: '-version-info/-version-number' is ignored for convenience libraries +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -o rsb_libspblas.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_spblas.a .libs/rsb_libspblas_handle.o .libs/rsb_libspblas.o libtool: link: ranlib .libs/librsb_spblas.a libtool: link: ( cd ".libs" && rm -f "librsb_spblas.la" && ln -s "../librsb_spblas.la" "librsb_spblas.la" ) +libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_base.a .libs/librsb_base_la-rsb_is.o .libs/librsb_base_la-rsb_mio.o .libs/librsb_base_la-rsb_op.o .libs/librsb_base_la-rsb_bio.o .libs/librsb_base_la-rsb_get.o .libs/librsb_base_la-rsb_set.o .libs/librsb_base_la-rsb_coo.o .libs/librsb_base_la-rsb_csr.o .libs/librsb_base_la-rsb_coo_check.o .libs/librsb_base_la-rsb_coo_symm.o .libs/librsb_base_la-rsb_idx.o .libs/librsb_base_la-rsb_srt.o .libs/librsb_base_la-rsb_srtp.o .libs/librsb_base_la-rsb_src.o .libs/librsb_base_la-rsb_test_accuracy.o .libs/librsb_base_la-rsb_clone.o .libs/librsb_base_la-rsb_rec.o .libs/librsb_base_la-rsb_render.o .libs/librsb_base_la-rsb_eps.o .libs/librsb_base_la-rsb_msort_up.o .libs/librsb_base_la-rsb_sys.o .libs/librsb_base_la-rsb_blas_stuff.o .libs/librsb_base_la-rsb_gen.o .libs/librsb_base_la-rsb_perf.o .libs/librsb_base_la-rsb_rsb.o .libs/librsb_base_la-rsb_err.o .libs/librsb_base_la-rsb_tune.o .libs/librsb_base_la-rsb_do.o .libs/librsb_base_la-rsb_internals.o .libs/librsb_base_la-rsb_garbage.o .libs/librsb_base_la-rsb_mmio.o .libs/librsb_base_la-rsb_partition.o .libs/librsb_base_la-rsb_mbw.o .libs/librsb_base_la-rsb_limiter.o .libs/librsb_base_la-rsb_fpb.o .libs/librsb_base_la-rsb_spgemm.o .libs/librsb_base_la-rsb_spsum.o .libs/librsb_base_la-rsb_spsv.o .libs/librsb_base_la-rsb_lock.o .libs/librsb_base_la-rsb_swt.o .libs/librsb_base_la-rsb_init.o .libs/librsb_base_la-rsb_dump.o .libs/librsb_base_la-rsb_cpmv.o .libs/librsb_base_la-rsb_asm.o .libs/librsb_base_la-rsb_user.o .libs/librsb_base_la-rsb_coo2rec.o .libs/librsb_base_la-rsb_rec2coo.o .libs/librsb_base_la-rsb_rec2csr.o .libs/librsb_base_la-rsb_csr2coo.o .libs/rsb_blas_sparse.o libtool: link: ranlib .libs/librsb_base.a libtool: link: ( cd ".libs" && rm -f "librsb_base.la" && ln -s "../librsb_base.la" "librsb_base.la" ) @@ -2371,12 +2407,12 @@ | ~~~~~~~~~~~~~~~~~ libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_nounroll.a .libs/librsb_nounroll_la-rsb_stropts.o .libs/librsb_nounroll_la-rsb_strmif.o .libs/librsb_nounroll_la-rsb_unroll.o .libs/librsb_nounroll_la-rsb_krnl_vb.o .libs/librsb_nounroll_la-rsb_krnl_lb.o .libs/librsb_nounroll_la-rsb_krnl.o .libs/librsb_nounroll_la-rsb_bench.o .libs/librsb_nounroll_la-rsb_mergesort.o .libs/librsb_nounroll_la-rsb_permute.o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss.o .libs/librsb_nounroll_la-rsb_spmv.o .libs/librsb_nounroll_la-rsb_merge.o .libs/librsb_nounroll_la-rsb_ompio.o .libs/librsb_nounroll_la-rsb_util.o .libs/librsb_nounroll_la-rsb_spgemm_csr.o .libs/librsb_nounroll_la-rsb_spsum_misc.o .libs/librsb_nounroll_la-rsb_prec.o libtool: link: ranlib .libs/librsb_nounroll.a libtool: link: ( cd ".libs" && rm -f "librsb_nounroll.la" && ln -s "../librsb_nounroll.la" "librsb_nounroll.la" ) -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/aarch64-linux-gnu rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/aarch64-linux-gnu rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: link: gcc -shared -fPIC -DPIC .libs/rsb.o -Wl,--whole-archive ./.libs/librsb_nounroll.a ./.libs/librsb_base.a ./.libs/librsb_spblas.a /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/.libs/librsbpp.a -Wl,--no-whole-archive -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lpthread -lstdc++fs -lstdc++ -lhwloc -lz -lgfortran -lm -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Werror=format-security -mbranch-protection=standard -O3 -Wl,-z -Wl,relro -fopenmp -fopenmp -Wl,-soname -Wl,librsb.so.0 -o .libs/librsb.so.0.0.0 libtool: link: (cd ".libs" && rm -f "librsb.so.0" && ln -s "librsb.so.0.0.0" "librsb.so.0") libtool: link: (cd ".libs" && rm -f "librsb.so" && ln -s "librsb.so.0.0.0" "librsb.so") @@ -2388,7 +2424,7 @@ libtool: link: ranlib .libs/librsb.a libtool: link: rm -fr .libs/librsb.lax libtool: link: ( cd ".libs" && rm -f "librsb.la" && ln -s "../librsb.la" "librsb.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: warning: '-version-info' is ignored for programs libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o -fopenmp ./.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -2405,27 +2441,27 @@ gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o fortran.o fortran.F90 gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o fortran_rsb_fi.o fortran_rsb_fi.F90 g++ -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -c -o cplusplus.o cplusplus.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/backsolve backsolve.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/io-spblas io-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/power power.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/hello-spblas hello-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/hello hello.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/backsolve backsolve.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran_rsb_fi fortran_rsb_fi.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/hello-spblas hello-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/power power.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/autotune autotune.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran_rsb_fi fortran_rsb_fi.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran fortran.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/snippets snippets.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/cplusplus cplusplus.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' Making all in scripts @@ -2445,9 +2481,9 @@ /usr/bin/mkdir -p man /usr/bin/mkdir -p man gmake makedox -SOURCE_DATE_EPOCH=1767272461 \ +SOURCE_DATE_EPOCH=1735642861 \ help2man --name="benchmark and test for librsb" --no-info ../rsbench | /usr/bin/sed 's/January //g' > man/rsbench.1 -SOURCE_DATE_EPOCH=1767272461 \ +SOURCE_DATE_EPOCH=1735642861 \ help2man --name="provide configuration information for librsb" --no-info /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb-config | /usr/bin/sed 's/January //g' > man/librsb-config.1 gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/doc' DOXYGEN_PROJECT_NUMBER=1.3.0.2 doxygen Doxyfile || echo "are you sure you have doxygen installed ?" @@ -3159,13 +3195,13 @@ g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt_ne-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt_rv-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' Making all in examples @@ -3180,25 +3216,25 @@ g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o mtx2bin.o mtx2bin.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o render.o render.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o span.o span.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib/examples' gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' @@ -3208,7 +3244,7 @@ gmake all-am gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' g++ -DHAVE_CONFIG_H -I. -I/build/reproducible-path/librsb-1.3.0.2+dfsg -Wdate-time -D_FORTIFY_SOURCE=2 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rsbtest.o rsbtest.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lstdc++fs -fopenmp gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' @@ -3284,7 +3320,7 @@ gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake mtests -C . gmake[3]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash -ex ./scripts/readme-tests.sh +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh -ex ./scripts/readme-tests.sh + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x + ./rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # --bench option implies -qH -R --write-performance-record --want-mkl-autotune --mkl-benchmark --types : --split-experimental 6 --merge-experimental 6 --also-transpose --sort-filenames-list --want-memory-benchmark @@ -3294,15 +3330,15 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1788680910 +# beginning run at 1754271489 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -# average timer granularity: 3.07e-08 s -# Will write a final performance record to file rsbench_pr__1788680910_gcc-14.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1788680910_gcc-14.2-1,4th.rpr.tmp +# average timer granularity: 8.19e-08 s +# Will write a final performance record to file rsbench_pr__1754271489_gcc-14.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1754271489_gcc-14.2-1,4th.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -3341,67 +3377,67 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 5.100s +# Memory benchmark took 5.395s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 8 samples (2240 bytes). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.102s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.399s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type Z... -# file input of A.mtx took 0.00 s (6 nnz, 35696 nnz/s ) (1.09 MB/s ) -#pre-sorting (6 elements) took 0.025028 s -#weeding duplicates (to 6 elements) took 3.09944e-06 s (and check, 9.53674e-07 s ) +# file input of A.mtx took 0.00 s (6 nnz, 37958 nnz/s ) (1.16 MB/s ) +#pre-sorting (6 elements) took 0.0136409 s +#weeding duplicates (to 6 elements) took 2.14577e-06 s (and check, 9.53674e-07 s ) # multi-nrhs benchmarking (1,2) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.051s): (3 x 3)[0xaaaadc88c6c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.011s): (3 x 3)[0xaaaac73016c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 0.0246s; avg 0.008201s ( +/- 14.81/ 7.50 %); best 0.006986s; worst 0.008816s; std dev. 0.000859 (taking best). -Reference operation time is 0.0069859 s (0.01374 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.006986 Mflops: 0.014) -Merge (3 -> 1 leaves) took w.c.t. of 1.788e-05s, ~6.914e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) -3 iterations (1 th.) took 0.0002689s; avg 8.965e-05s ( +/- 99.96/200.00 %); best 3.175e-08s; worst 0.0002689s; std dev. 0.0001268 (taking best). -Reference operation time is 3.17454e-08 s (3024 Mflops) with 1 threads. -After merge step 1: tpop: 3.175e-08 s ~Mflops: 3024.057 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 220060.083x: 0.006986s -> 3.175e-08s, so taking this instance. +3 iterations (1 th.) took 0.004321s; avg 0.00144s ( +/- 10.37/ 8.39 %); best 0.001291s; worst 0.001561s; std dev. 0.0001121 (taking best). +Reference operation time is 0.00129104 s (0.07436 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001291 Mflops: 0.074) +Merge (3 -> 1 leaves) took w.c.t. of 6.795e-05s, ~2.789e-05s of computing time (of which 5.007e-06s sorting, 5.007e-06s analysis) +3 iterations (1 th.) took 0.0003018s; avg 0.0001006s ( +/- 99.92/200.00 %); best 8.105e-08s; worst 0.0003018s; std dev. 0.0001423 (taking best). +Reference operation time is 8.10504e-08 s (1184 Mflops) with 1 threads. +After merge step 1: tpop: 8.105e-08 s ~Mflops: 1184.448 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 15928.813x: 0.001291s -> 8.105e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02318s (of which 2.098e-05s partitioning, 0s I/O); computing times: 6.914e-06s in par. loops, 9.537e-07s sorting, 5.007e-06s analyzing) -Total merge + benchmarking process took 0.02318s, equivalent to 730154.0/3.3 new/old ops (0.04357s for 2 clones -- as 1372549.8/6.2 ops, or 686274.9/3.1 ops per clone), SPEEDUP of 220060.083x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 220060.083x (0.006986s -> 3.175e-08s), will amortize in 3.3 ops by saving 0.006986s per op. -In 1 tuning rounds (tot. 0.069s, 0.044s for constructor, 2 clones) obtained a SPEEDUP of 22005908.3% (2.201e+05x) (from 0.01374 to 3024 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003724s (of which 7.486e-05s partitioning, 0s I/O); computing times: 2.789e-05s in par. loops, 5.007e-06s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.003724s, equivalent to 45945.0/2.9 new/old ops (0.007396s for 2 clones -- as 91254.6/5.7 ops, or 45627.3/2.9 ops per clone), SPEEDUP of 15928.813x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 15928.813x (0.001291s -> 8.105e-08s), will amortize in 2.9 ops by saving 0.001291s per op. +In 1 tuning rounds (tot. 0.012s, 0.0074s for constructor, 2 clones) obtained a SPEEDUP of 1592781.3% (1.593e+04x) (from 0.07436 to 1184 Mflops). #pr: updating sample at index 1 (0^th of 8), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.068644 s (6.986e-03 s -> 3.175e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.012291 s (1.291e-03 s -> 8.105e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.403943 s and estimated a speedup of 1.000000 x (3.175e-08 s -> 3.175e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0695338 s and estimated a speedup of 1.000000 x (8.105e-08 s -> 8.105e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000001 0.012091 0.023099 0.035190 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.035191 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.012091 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.023099 -%:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000001 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 1.000 -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.035190 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.005021 0.003373 0.008394 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.008394 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.005021 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.003373 +%:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 nan +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.008394 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:RSB_SUBDIVISION_SCALING:A.mtx S N 1 3 3 6 1.00 %:RSB_SHUFFLE_SCALING:A.mtx S N 1 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 1 3 3 6 1.00 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:A.mtx S N 1 3 3 6 nan 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 1 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 1 3 3 6 28 48 36 @@ -3410,47 +3446,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.075s): (3 x 3)[0xaaaadc88c6c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.013s): (3 x 3)[0xaaaac73016c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.02319s; avg 0.007729s ( +/- 53.18/ 47.13 %); best 0.003619s; worst 0.01137s; std dev. 0.003182 (taking best). -Reference operation time is 0.00361896 s (0.02653 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.003619 Mflops: 0.027) -Merge (3 -> 1 leaves) took w.c.t. of 1.216e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (4 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 97.65/200.00 %); best 3.175e-08s; worst 4.053e-06s; std dev. 1.911e-06 (taking best). -Reference operation time is 3.17454e-08 s (3024 Mflops) with 4 threads. -After merge step 1: tpop: 3.175e-08 s ~Mflops: 3024.057 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 113999.249x: 0.003619s -> 3.175e-08s, so taking this instance. +3 iterations (4 th.) took 0.005096s; avg 0.001699s ( +/- 46.31/ 90.73 %); best 0.000912s; worst 0.00324s; std dev. 0.00109 (taking best). +Reference operation time is 0.000911951 s (0.1053 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000912 Mflops: 0.105) +Merge (3 -> 1 leaves) took w.c.t. of 1.097e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) +3 iterations (4 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 92.16/107.69 %); best 8.105e-08s; worst 2.146e-06s; std dev. 8.778e-07 (taking best). +Reference operation time is 8.10504e-08 s (1184 Mflops) with 4 threads. +After merge step 1: tpop: 8.105e-08 s ~Mflops: 1184.448 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 11251.655x: 0.000912s -> 8.105e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02461s (of which 1.407e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.02461s, equivalent to 775103.3/6.8 new/old ops (0.04917s for 2 clones -- as 1548952.3/13.6 ops, or 774476.2/6.8 ops per clone), SPEEDUP of 113999.249x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 113999.249x (0.003619s -> 3.175e-08s), will amortize in 6.8 ops by saving 0.003619s per op. -In 1 tuning rounds (tot. 0.072s, 0.049s for constructor, 2 clones) obtained a SPEEDUP of 11399824.9% (1.14e+05x) (from 0.02653 to 3024 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.006101s (of which 1.311e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.006101s, equivalent to 75275.8/6.7 new/old ops (0.008554s for 2 clones -- as 105536.1/9.4 ops, or 52768.1/4.7 ops per clone), SPEEDUP of 11251.655x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 11251.655x (0.000912s -> 8.105e-08s), will amortize in 6.7 ops by saving 0.0009119s per op. +In 1 tuning rounds (tot. 0.014s, 0.0086s for constructor, 2 clones) obtained a SPEEDUP of 1125065.5% (1.125e+04x) (from 0.1053 to 1184 Mflops). #pr: updating sample at index 5 (1^th of 8), 0^th touch for (0,1,0,0,0,0,0). -First run of RSB Autotuner took 0.0724399 s (3.619e-03 s -> 3.175e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0137351 s (9.120e-04 s -> 8.105e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.411749 s and estimated a speedup of 1.000000 x (3.175e-08 s -> 3.175e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0438039 s and estimated a speedup of 1.000000 x (8.105e-08 s -> 8.105e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.026488 0.029289 0.055777 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.055777 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.026488 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.029289 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.004470 0.004281 0.008751 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.008751 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.004470 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.004281 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 inf -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.055777 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.008751 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.63 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.63 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.46 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.96 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.96 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 1.12 %:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.79 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 inf 0.46 0.79 0.63 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 1.12 0.79 0.96 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -3459,50 +3495,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 0.0511589 1e+09 1e+09 +%operation:A.mtx 0.011199 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 1.19209e-06 0.0120912 0 0.0230989 +%constructor:A.mtx 0 0.00502086 0 0.00337291 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,2) -- now using nrhs 2. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.040s): (3 x 3)[0xaaaadc88c6c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.003s): (3 x 3)[0xaaaac73016c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 0.02779s; avg 0.009263s ( +/- 11.52/ 20.45 %); best 0.008196s; worst 0.01116s; std dev. 0.001343 (taking best). -Reference operation time is 0.00819588 s (0.02343 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.008196 Mflops: 0.023) -Merge (3 -> 1 leaves) took w.c.t. of 1.383e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) -3 iterations (1 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 97.65/200.00 %); best 3.175e-08s; worst 4.053e-06s; std dev. 1.911e-06 (taking best). -Reference operation time is 3.17454e-08 s (6048 Mflops) with 1 threads. -After merge step 1: tpop: 3.175e-08 s ~Mflops: 6048.114 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 258174.991x: 0.008196s -> 3.175e-08s, so taking this instance. +3 iterations (1 th.) took 0.001941s; avg 0.000647s ( +/- 5.40/ 10.66 %); best 0.000612s; worst 0.000716s; std dev. 4.878e-05 (taking best). +Reference operation time is 0.00061202 s (0.3137 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000612 Mflops: 0.314) +Merge (3 -> 1 leaves) took w.c.t. of 7.153e-06s, ~2.861e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) +3 iterations (1 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 94.00/129.41 %); best 8.105e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). +Reference operation time is 8.10504e-08 s (2369 Mflops) with 1 threads. +After merge step 1: tpop: 8.105e-08 s ~Mflops: 2368.897 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 7551.110x: 0.000612s -> 8.105e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01986s (of which 1.502e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 1.907e-06s analyzing) -Total merge + benchmarking process took 0.01986s, equivalent to 625602.7/2.4 new/old ops (0.04777s for 2 clones -- as 1504686.4/5.8 ops, or 752343.2/2.9 ops per clone), SPEEDUP of 258174.991x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 258174.991x (0.008196s -> 3.175e-08s), will amortize in 2.4 ops by saving 0.008196s per op. -In 1 tuning rounds (tot. 0.076s, 0.048s for constructor, 2 clones) obtained a SPEEDUP of 25817399.1% (2.582e+05x) (from 0.02343 to 6048 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002012s (of which 1.001e-05s partitioning, 0s I/O); computing times: 2.861e-06s in par. loops, 9.537e-07s sorting, 1.192e-06s analyzing) +Total merge + benchmarking process took 0.002012s, equivalent to 24824.2/3.3 new/old ops (0.004023s for 2 clones -- as 49636.7/6.6 ops, or 24818.4/3.3 ops per clone), SPEEDUP of 7551.110x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 7551.110x (0.000612s -> 8.105e-08s), will amortize in 3.3 ops by saving 0.0006119s per op. +In 1 tuning rounds (tot. 0.006s, 0.004s for constructor, 2 clones) obtained a SPEEDUP of 755011.0% (7551x) (from 0.3137 to 2369 Mflops). #pr: updating sample at index 3 (2^th of 8), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.0756371 s (8.196e-03 s -> 3.175e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00602007 s (6.120e-04 s -> 8.105e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.416153 s and estimated a speedup of 1.000000 x (3.175e-08 s -> 3.175e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.050596 s and estimated a speedup of 1.000000 x (8.105e-08 s -> 8.105e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.008370 0.019366 0.027736 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.027736 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.008370 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.019366 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.000758 0.001291 0.002049 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.002049 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.000758 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.001291 %:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.027736 +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.002049 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 @@ -3517,47 +3553,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.079s): (3 x 3)[0xaaaadc88c6c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.020s): (3 x 3)[0xaaaac73016c0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.02106s; avg 0.007019s ( +/- 27.91/ 25.65 %); best 0.00506s; worst 0.008819s; std dev. 0.001539 (taking best). -Reference operation time is 0.00505996 s (0.03794 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.00506 Mflops: 0.038) -Merge (3 -> 1 leaves) took w.c.t. of 1.311e-05s, ~3.815e-06s of computing time (of which 0s sorting, 3.099e-06s analysis) -3 iterations (4 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 98.10/200.00 %); best 3.175e-08s; worst 5.007e-06s; std dev. 2.36e-06 (taking best). -Reference operation time is 3.17454e-08 s (6048 Mflops) with 4 threads. -After merge step 1: tpop: 3.175e-08 s ~Mflops: 6048.114 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 159391.664x: 0.00506s -> 3.175e-08s, so taking this instance. +3 iterations (4 th.) took 0.005811s; avg 0.001937s ( +/- 27.11/ 28.34 %); best 0.001412s; worst 0.002486s; std dev. 0.0004388 (taking best). +Reference operation time is 0.00141191 s (0.136 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001412 Mflops: 0.136) +Merge (3 -> 1 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (4 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 91.50/200.00 %); best 8.105e-08s; worst 2.861e-06s; std dev. 1.349e-06 (taking best). +Reference operation time is 8.10504e-08 s (2369 Mflops) with 4 threads. +After merge step 1: tpop: 8.105e-08 s ~Mflops: 2368.897 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 17420.209x: 0.001412s -> 8.105e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.03093s (of which 1.502e-05s partitioning, 0s I/O); computing times: 3.815e-06s in par. loops, 0s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.03093s, equivalent to 974344.7/6.1 new/old ops (0.05822s for 2 clones -- as 1833939.2/11.5 ops, or 916969.6/5.8 ops per clone), SPEEDUP of 159391.664x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 159391.664x (0.00506s -> 3.175e-08s), will amortize in 6.1 ops by saving 0.00506s per op. -In 1 tuning rounds (tot. 0.079s, 0.058s for constructor, 2 clones) obtained a SPEEDUP of 15939066.4% (1.594e+05x) (from 0.03794 to 6048 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.004796s (of which 1.502e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.004796s, equivalent to 59173.4/3.4 new/old ops (0.00869s for 2 clones -- as 107215.8/6.2 ops, or 53607.9/3.1 ops per clone), SPEEDUP of 17420.209x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 17420.209x (0.001412s -> 8.105e-08s), will amortize in 3.4 ops by saving 0.001412s per op. +In 1 tuning rounds (tot. 0.015s, 0.0087s for constructor, 2 clones) obtained a SPEEDUP of 1741920.9% (1.742e+04x) (from 0.136 to 2369 Mflops). #pr: updating sample at index 7 (3^th of 8), 0^th touch for (0,1,0,0,1,0,0). -First run of RSB Autotuner took 0.079356 s (5.060e-03 s -> 3.175e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0145791 s (1.412e-03 s -> 8.105e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.416193 s and estimated a speedup of 1.000000 x (3.175e-08 s -> 3.175e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.081229 s and estimated a speedup of 1.000000 x (8.105e-08 s -> 8.105e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.022141 0.044003 0.066144 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.066144 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.022141 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.044003 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002784 0.013552 0.016336 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.016336 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002784 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.013552 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.066144 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.016336 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.42 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.42 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.38 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.44 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.38 0.44 0.42 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.13 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.13 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.27 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.10 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.27 0.10 0.13 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -3566,184 +3602,184 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 0.039963 1e+09 1e+09 +%operation:A.mtx 0.00349188 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 0 0.00836992 0 0.019366 +%constructor:A.mtx 0 0.000757933 0 0.00129104 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 7.487s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.944s/0.000s . +# so far, program took 5.781s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.292s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.05055s (system CPU time used) -ru_utime : 4.28s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.08368s (system CPU time used) +ru_utime : 6.789s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 3024.06 6.986e-03 0.000e+00 3.175e-08 0.000e+00 6.864e-02 8.44e+00 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 3024.06 3.619e-03 0.000e+00 3.175e-08 0.000e+00 7.244e-02 8.44e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1184.45 1.291e-03 0.000e+00 8.105e-08 0.000e+00 1.229e-02 3.31e+00 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1184.45 9.120e-04 0.000e+00 8.105e-08 0.000e+00 1.374e-02 3.31e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 16702866.6 % faster, avg. sp. ratio 167029.666x, max sp. ratio 220060.083x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2222114.2/2162328.2/2281900.1/4444228.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.9/ 9.8/ 20.0/ 29.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 14.9, min. 9.8, max. 20.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1358923.4 % faster, avg. sp. ratio 13590.234x, max sp. ratio 15928.813x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 160554.5/151645.8/169463.2/321109.0 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 12.3/ 9.5/ 15.1/ 24.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 12.3, min. 9.5, max. 15.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 6.930/ 6.930/ 6.930,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.884/ 8.442/ 8.442,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.714/ 2.714/ 2.714,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.613/ 3.307/ 3.307,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.024e+03, min 3.024e+03, max 3.024e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.013e-02, min 1.374e-02, max 2.653e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 3.175e-08s, min 3.175e-08s, max 3.175e-08s, tot 6.349e-08s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.302e-03s, min 3.619e-03s, max 6.986e-03s, tot 1.060e-02s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 3.095e+00 3.095e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.051e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.184e+03, min 1.184e+03, max 1.184e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.981e-02, min 7.436e-02, max 1.053e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 8.105e-08s, min 8.105e-08s, max 8.105e-08s, tot 1.621e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.101e-03s, min 9.120e-04s, max 1.291e-03s, tot 2.203e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.569e+01 1.569e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.121e+00 #pr: ======== Limiting to nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 6048.11 8.196e-03 0.000e+00 3.175e-08 0.000e+00 7.564e-02 1.30e+01 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 6048.11 5.060e-03 0.000e+00 3.175e-08 0.000e+00 7.936e-02 1.30e+01 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2368.90 6.120e-04 0.000e+00 8.105e-08 0.000e+00 6.020e-03 5.08e+00 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2368.90 1.412e-03 0.000e+00 8.105e-08 0.000e+00 1.458e-02 5.08e+00 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 20878232.7 % faster, avg. sp. ratio 208783.327x, max sp. ratio 258174.991x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2441186.6/2382613.6/2499759.7/4882373.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 12.5/ 9.2/ 15.7/ 24.9 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 12.5, min. 9.2, max. 15.7 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1248466.0 % faster, avg. sp. ratio 12485.660x, max sp. ratio 17420.209x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 127076.0/74275.6/179876.5/254152.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.1/ 9.8/ 10.3/ 20.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 10.1, min. 9.8, max. 10.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 9.954/ 9.954/ 9.954,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 25.956/ 12.978/ 12.978,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.899/ 3.899/ 3.899,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.167/ 5.083/ 5.083,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.08 s, min 0.08 s, max 0.08 s, tot 0.15 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.08 s, min 0.08 s, max 0.08 s, tot 0.15 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 6.048e+03, min 6.048e+03, max 6.048e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.069e-02, min 2.343e-02, max 3.794e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 3.175e-08s, min 3.175e-08s, max 3.175e-08s, tot 6.349e-08s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.628e-03s, min 5.060e-03s, max 8.196e-03s, tot 1.326e-02s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.155e+00 2.155e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.051e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.369e+03, min 2.369e+03, max 2.369e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.249e-01, min 1.360e-01, max 3.137e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 8.105e-08s, min 8.105e-08s, max 8.105e-08s, tot 1.621e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.012e-03s, min 6.120e-04s, max 1.412e-03s, tot 2.024e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.092e+01 1.092e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.121e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 3024.06 6.986e-03 0.000e+00 3.175e-08 0.000e+00 6.864e-02 8.44e+00 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 6048.11 8.196e-03 0.000e+00 3.175e-08 0.000e+00 7.564e-02 1.30e+01 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 3024.06 3.619e-03 0.000e+00 3.175e-08 0.000e+00 7.244e-02 8.44e+00 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 6048.11 5.060e-03 0.000e+00 3.175e-08 0.000e+00 7.936e-02 1.30e+01 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1184.45 1.291e-03 0.000e+00 8.105e-08 0.000e+00 1.229e-02 3.31e+00 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2368.90 6.120e-04 0.000e+00 8.105e-08 0.000e+00 6.020e-03 5.08e+00 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1184.45 9.120e-04 0.000e+00 8.105e-08 0.000e+00 1.374e-02 3.31e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2368.90 1.412e-03 0.000e+00 8.105e-08 0.000e+00 1.458e-02 5.08e+00 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 18790549.6 % faster, avg. sp. ratio 187906.496x, max sp. ratio 258174.991x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2331650.4/2162328.2/2499759.7/9326601.6 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.7/ 9.2/ 20.0/ 54.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 13.7, min. 9.2, max. 20.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1303694.7 % faster, avg. sp. ratio 13037.947x, max sp. ratio 17420.209x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 143815.3/74275.6/179876.5/575261.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.2/ 9.5/ 15.1/ 44.7 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 11.2, min. 9.5, max. 15.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 8.442/ 6.930/ 9.954,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 42.841/ 8.442/ 12.978,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.307/ 2.714/ 3.899,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.780/ 3.307/ 5.083,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.30 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.30 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 4.536e+03, min 3.024e+03, max 6.048e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.541e-02, min 1.374e-02, max 3.794e-02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 3.175e-08s, min 3.175e-08s, max 3.175e-08s, tot 1.270e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.965e-03s, min 3.619e-03s, max 8.196e-03s, tot 2.386e-02s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.155e+00 3.095e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.051e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.777e+03, min 1.184e+03, max 2.369e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.573e-01, min 7.436e-02, max 3.137e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 8.105e-08s, min 8.105e-08s, max 8.105e-08s, tot 3.242e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.057e-03s, min 6.120e-04s, max 1.412e-03s, tot 4.227e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.092e+01 1.569e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.121e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 3024.06 6.986e-03 0.000e+00 3.175e-08 0.000e+00 6.864e-02 8.44e+00 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 3024.06 3.619e-03 0.000e+00 3.175e-08 0.000e+00 7.244e-02 8.44e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1184.45 1.291e-03 0.000e+00 8.105e-08 0.000e+00 1.229e-02 3.31e+00 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1184.45 9.120e-04 0.000e+00 8.105e-08 0.000e+00 1.374e-02 3.31e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 16702866.6 % faster, avg. sp. ratio 167029.666x, max sp. ratio 220060.083x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2222114.2/2162328.2/2281900.1/4444228.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.9/ 9.8/ 20.0/ 29.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 14.9, min. 9.8, max. 20.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1358923.4 % faster, avg. sp. ratio 13590.234x, max sp. ratio 15928.813x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 160554.5/151645.8/169463.2/321109.0 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 12.3/ 9.5/ 15.1/ 24.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 12.3, min. 9.5, max. 15.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 6.930/ 6.930/ 6.930,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.884/ 8.442/ 8.442,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.714/ 2.714/ 2.714,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.613/ 3.307/ 3.307,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.024e+03, min 3.024e+03, max 3.024e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.013e-02, min 1.374e-02, max 2.653e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 3.175e-08s, min 3.175e-08s, max 3.175e-08s, tot 6.349e-08s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.302e-03s, min 3.619e-03s, max 6.986e-03s, tot 1.060e-02s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 3.095e+00 3.095e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.051e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.184e+03, min 1.184e+03, max 1.184e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.981e-02, min 7.436e-02, max 1.053e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 8.105e-08s, min 8.105e-08s, max 8.105e-08s, tot 1.621e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.101e-03s, min 9.120e-04s, max 1.291e-03s, tot 2.203e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.569e+01 1.569e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.121e+00 #pr: ======== Limiting to both transA=N and nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 6048.11 8.196e-03 0.000e+00 3.175e-08 0.000e+00 7.564e-02 1.30e+01 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 6048.11 5.060e-03 0.000e+00 3.175e-08 0.000e+00 7.936e-02 1.30e+01 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2368.90 6.120e-04 0.000e+00 8.105e-08 0.000e+00 6.020e-03 5.08e+00 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2368.90 1.412e-03 0.000e+00 8.105e-08 0.000e+00 1.458e-02 5.08e+00 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 20878232.7 % faster, avg. sp. ratio 208783.327x, max sp. ratio 258174.991x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2441186.6/2382613.6/2499759.7/4882373.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 12.5/ 9.2/ 15.7/ 24.9 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 12.5, min. 9.2, max. 15.7 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1248466.0 % faster, avg. sp. ratio 12485.660x, max sp. ratio 17420.209x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 127076.0/74275.6/179876.5/254152.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.1/ 9.8/ 10.3/ 20.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 10.1, min. 9.8, max. 10.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 9.954/ 9.954/ 9.954,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 25.956/ 12.978/ 12.978,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.899/ 3.899/ 3.899,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.167/ 5.083/ 5.083,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.08 s, min 0.08 s, max 0.08 s, tot 0.15 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.08 s, min 0.08 s, max 0.08 s, tot 0.15 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 6.048e+03, min 6.048e+03, max 6.048e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.069e-02, min 2.343e-02, max 3.794e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 3.175e-08s, min 3.175e-08s, max 3.175e-08s, tot 6.349e-08s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.628e-03s, min 5.060e-03s, max 8.196e-03s, tot 1.326e-02s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.155e+00 2.155e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.051e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.369e+03, min 2.369e+03, max 2.369e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.249e-01, min 1.360e-01, max 3.137e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 8.105e-08s, min 8.105e-08s, max 8.105e-08s, tot 1.621e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.012e-03s, min 6.120e-04s, max 1.412e-03s, tot 2.024e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.092e+01 1.092e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.121e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 4) matched the dump criteria -- skipping dump round. @@ -3754,44 +3790,44 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 3024.06 6.986e-03 0.000e+00 3.175e-08 0.000e+00 6.864e-02 8.44e+00 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 6048.11 8.196e-03 0.000e+00 3.175e-08 0.000e+00 7.564e-02 1.30e+01 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 3024.06 3.619e-03 0.000e+00 3.175e-08 0.000e+00 7.244e-02 8.44e+00 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 6048.11 5.060e-03 0.000e+00 3.175e-08 0.000e+00 7.936e-02 1.30e+01 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1184.45 1.291e-03 0.000e+00 8.105e-08 0.000e+00 1.229e-02 3.31e+00 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2368.90 6.120e-04 0.000e+00 8.105e-08 0.000e+00 6.020e-03 5.08e+00 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1184.45 9.120e-04 0.000e+00 8.105e-08 0.000e+00 1.374e-02 3.31e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2368.90 1.412e-03 0.000e+00 8.105e-08 0.000e+00 1.458e-02 5.08e+00 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 18790549.6 % faster, avg. sp. ratio 187906.496x, max sp. ratio 258174.991x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2331650.4/2162328.2/2499759.7/9326601.6 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.7/ 9.2/ 20.0/ 54.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 13.7, min. 9.2, max. 20.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1303694.7 % faster, avg. sp. ratio 13037.947x, max sp. ratio 17420.209x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 143815.3/74275.6/179876.5/575261.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.2/ 9.5/ 15.1/ 44.7 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 11.2, min. 9.5, max. 15.1 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 8.442/ 6.930/ 9.954,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 42.841/ 8.442/ 12.978,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.307/ 2.714/ 3.899,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.780/ 3.307/ 5.083,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.30 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.30 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 4.536e+03, min 3.024e+03, max 6.048e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.541e-02, min 1.374e-02, max 3.794e-02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 3.175e-08s, min 3.175e-08s, max 3.175e-08s, tot 1.270e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.965e-03s, min 3.619e-03s, max 8.196e-03s, tot 2.386e-02s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.155e+00 3.095e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.051e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.777e+03, min 1.184e+03, max 2.369e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.573e-01, min 7.436e-02, max 3.137e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 8.105e-08s, min 8.105e-08s, max 8.105e-08s, tot 3.242e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.057e-03s, min 6.120e-04s, max 1.412e-03s, tot 4.227e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.092e+01 1.569e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.121e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) -#pr: Record collection took 1.92 s. +#pr: Record collection took 0.29 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 100 environment variables in 5413 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 100 environment variables in 5467 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1788680910_gcc-14.2-1,4th.rpr -# Removing the temporary record file rsbench_pr__1788680910_gcc-14.2-1,4th.rpr.tmp. -# terminating run at 1788680917 (after 7.5s of w.c.t.) +#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1754271489_gcc-14.2-1,4th.rpr +# Removing the temporary record file rsbench_pr__1754271489_gcc-14.2-1,4th.rpr.tmp. +# terminating run at 1754271495 (after 5.8s of w.c.t.) + ./rsbench -oa -Ob --help /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench is a swiss army knife for testing the library functionality and performance. You can use it to perform sparse matrix - unitary vector multiplication, specifying the blocking parameters, the times to perform multiplication. @@ -4065,8 +4101,8 @@ sysconf() : 4096 bytes per pagesize sysconf() : 8203948 physical pages sysconf() : 33603371008 bytes (32046 MB) of physical memory -sysconf() : 1419344 available (free) physical pages -sysconf() : 5813633024 available (free) physical memory +sysconf() : 1254671 available (free) physical pages +sysconf() : 5139132416 available (free) physical memory sysconf() , processors : 12 sysconf() , processors online : 12 sysconf() : no level 1 cache @@ -4091,30 +4127,30 @@ RSB_SUBM_IDX_MARKER : 2147483647 RSB_MAX_ALLOCATABLE_MEMORY_CHUNK: 18446744073709551615 timing min delta (if negative, don't complain with us) : 0 s -timing granularity : 3.73483e-08 s +timing granularity : 3.0005e-08 s CFLAGS : -g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 CXXFLAGS : -g -O2 -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp CC : gcc memhinfo : L2:4/64/512K,L1:8/64/24K -detected free memory : 5813116928 +detected free memory : 5139132416 detected total memory : 33603371008 -for array sized 524288 elems, took 0.000349998 s for linear search and 0 s for binary search for element 524287, in 145 tries, for a total of 0.100131 s (ignore this:152043230) -for array sized 524288 elems, took 0.000174999 s for linear search and 0 s for binary search for element 262143, in 283 tries, for a total of 0.102620 s (ignore this:300416168) -for array sized 524288 elems, took 8.67844e-05 s for linear search and 0 s for binary search for element 131071, in 579 tries, for a total of 0.103793 s (ignore this:452196386) -for array sized 524288 elems, took 4.29153e-05 s for linear search and 0 s for binary search for element 65535, in 1165 tries, for a total of 0.100030 s (ignore this:604892936) -for array sized 524288 elems, took 2.09808e-05 s for linear search and 0 s for binary search for element 32767, in 2519 tries, for a total of 0.100009 s (ignore this:769973082) -for array sized 524288 elems, took 1.09673e-05 s for linear search and 0 s for binary search for element 16383, in 5121 tries, for a total of 0.100008 s (ignore this:937767768) -for array sized 524288 elems, took 4.76837e-06 s for linear search and 0 s for binary search for element 8191, in 9930 tries, for a total of 0.100000 s (ignore this:1100441028) -for array sized 524288 elems, took 1.90735e-06 s for linear search and 0 s for binary search for element 4095, in 24960 tries, for a total of 0.107779 s (ignore this:1304863428) -for array sized 524288 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 2047, in 48337 tries, for a total of 0.100002 s (ignore this:1502755106) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 1023, in 125910 tries, for a total of 0.100000 s (ignore this:1760366966) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 511, in 221430 tries, for a total of 0.100001 s (ignore this:1986668426) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 255, in 351245 tries, for a total of 0.100001 s (ignore this:-2129163920) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 127, in 548946 tries, for a total of 0.100000 s (ignore this:-1989731636) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 63, in 718373 tries, for a total of 0.100000 s (ignore this:-1899216638) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 31, in 608658 tries, for a total of 0.100001 s (ignore this:-1861479842) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 15, in 497444 tries, for a total of 0.105249 s (ignore this:-1846556522) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 7, in 491876 tries, for a total of 0.100001 s (ignore this:-1839670258) +for array sized 524288 elems, took 0.000349998 s for linear search and 0 s for binary search for element 524287, in 242 tries, for a total of 0.100014 s (ignore this:253754908) +for array sized 524288 elems, took 0.000174999 s for linear search and 0 s for binary search for element 262143, in 568 tries, for a total of 0.100036 s (ignore this:551549356) +for array sized 524288 elems, took 8.67844e-05 s for linear search and 0 s for binary search for element 131071, in 1137 tries, for a total of 0.100049 s (ignore this:849604810) +for array sized 524288 elems, took 4.29153e-05 s for linear search and 0 s for binary search for element 65535, in 2274 tries, for a total of 0.100034 s (ignore this:1147657990) +for array sized 524288 elems, took 2.09808e-05 s for linear search and 0 s for binary search for element 32767, in 4540 tries, for a total of 0.100008 s (ignore this:1445182350) +for array sized 524288 elems, took 1.09673e-05 s for linear search and 0 s for binary search for element 16383, in 9020 tries, for a total of 0.100006 s (ignore this:1740731670) +for array sized 524288 elems, took 4.76837e-06 s for linear search and 0 s for binary search for element 8191, in 17947 tries, for a total of 0.100003 s (ignore this:2034739424) +for array sized 524288 elems, took 1.90735e-06 s for linear search and 0 s for binary search for element 4095, in 35303 tries, for a total of 0.100003 s (ignore this:-1971096302) +for array sized 524288 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 2047, in 68275 tries, for a total of 0.100001 s (ignore this:-1691578452) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 1023, in 128050 tries, for a total of 0.100000 s (ignore this:-1429588152) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 511, in 227754 tries, for a total of 0.100001 s (ignore this:-1196823564) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 255, in 384682 tries, for a total of 0.100001 s (ignore this:-1000635744) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 127, in 574457 tries, for a total of 0.100000 s (ignore this:-854723666) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 63, in 765628 tries, for a total of 0.100000 s (ignore this:-758254538) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 31, in 916709 tries, for a total of 0.100001 s (ignore this:-701418580) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 15, in 1026895 tries, for a total of 0.100000 s (ignore this:-670611730) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 7, in 1059833 tries, for a total of 0.100001 s (ignore this:-655774068) + ./rsbench -C /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench version: 1.3.0 format switches:br @@ -4161,17 +4197,17 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1788680920 +# beginning run at 1754271497 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx --verbose --nrhs 1,4 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 # User did not specify threads; assuming 1. Environment provides max 12 threads; this build supports max 128. # User did not specify threads; assuming 1. Environment provides max 12 threads; this build supports max 128. -# average timer granularity: 3e-08 s -# Will write a final performance record to file rsbench_pr__1788680920_gcc-14.2.rpr and periodic checkpoints to rsbench_pr__1788680920_gcc-14.2.rpr.tmp +# average timer granularity: 5.32e-08 s +# Will write a final performance record to file rsbench_pr__1754271497_gcc-14.2.rpr and periodic checkpoints to rsbench_pr__1754271497_gcc-14.2.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -4210,61 +4246,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 4.857s +# Memory benchmark took 5.421s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 16 samples (4480 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 4.858s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.424s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type D... -# file input of A.mtx took 0.00 s (6 nnz, 77913 nnz/s ) (2.39 MB/s ) -#pre-sorting (6 elements) took 0.020896 s +# file input of A.mtx took 0.00 s (6 nnz, 79892 nnz/s ) (2.45 MB/s ) +#pre-sorting (6 elements) took 0.0235789 s #weeding duplicates (to 6 elements) took 3.09944e-06 s (and check, 9.53674e-07 s ) # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.055s): (3 x 3)[0xaaab0761de50]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.009s): (3 x 3)[0xaaab17411ed0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.02377s; avg 0.007923s ( +/- 1.96/ 3.64 %); best 0.007768s; worst 0.008212s; std dev. 0.0002042 (taking best). -Reference operation time is 0.00776815 s (0.00309 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.007768 Mflops: 0.003) -Merge (3 -> 1 leaves) took w.c.t. of 2.503e-05s, ~9.06e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) -3 iterations (12 th.) took 0.0001512s; avg 5.039e-05s ( +/- 99.94/200.00 %); best 3.099e-08s; worst 0.0001512s; std dev. 7.126e-05 (taking best). -Reference operation time is 3.09944e-08 s (774.3 Mflops) with 12 threads. -After merge step 1: tpop: 3.099e-08 s ~Mflops: 774.333 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 250630.769x: 0.007768s -> 3.099e-08s, so taking this instance. +3 iterations (12 th.) took 0.01858s; avg 0.006193s ( +/- 27.05/ 14.24 %); best 0.004518s; worst 0.007075s; std dev. 0.001185 (taking best). +Reference operation time is 0.00451803 s (0.005312 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.004518 Mflops: 0.005) +Merge (3 -> 1 leaves) took w.c.t. of 2.599e-05s, ~1.001e-05s of computing time (of which 0s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 0.000124s; avg 4.133e-05s ( +/- 99.87/197.69 %); best 5.335e-08s; worst 0.000123s; std dev. 5.777e-05 (taking best). +Reference operation time is 5.33462e-08 s (449.9 Mflops) with 12 threads. +After merge step 1: tpop: 5.335e-08 s ~Mflops: 449.892 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 84692.737x: 0.004518s -> 5.335e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02419s (of which 2.813e-05s partitioning, 0s I/O); computing times: 9.06e-06s in par. loops, 9.537e-07s sorting, 5.007e-06s analyzing) -Total merge + benchmarking process took 0.02419s, equivalent to 780592.3/3.1 new/old ops (0.04814s for 2 clones -- as 1553176.9/6.2 ops, or 776588.5/3.1 ops per clone), SPEEDUP of 250630.769x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 250630.769x (0.007768s -> 3.099e-08s), will amortize in 3.1 ops by saving 0.007768s per op. -In 1 tuning rounds (tot. 0.072s, 0.048s for constructor, 2 clones) obtained a SPEEDUP of 25062976.9% (2.506e+05x) (from 0.00309 to 774.3 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01347s (of which 3.099e-05s partitioning, 0s I/O); computing times: 1.001e-05s in par. loops, 0s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.01347s, equivalent to 252558.7/3.0 new/old ops (0.01948s for 2 clones -- as 365184.4/4.3 ops, or 182592.2/2.2 ops per clone), SPEEDUP of 84692.737x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 84692.737x (0.004518s -> 5.335e-08s), will amortize in 3.0 ops by saving 0.004518s per op. +In 1 tuning rounds (tot. 0.038s, 0.019s for constructor, 2 clones) obtained a SPEEDUP of 8469173.7% (8.469e+04x) (from 0.005312 to 449.9 Mflops). #pr: updating sample at index 1 (0^th of 16), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.072202 s (7.768e-03 s -> 3.099e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.038424 s (4.518e-03 s -> 5.335e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.399757 s and estimated a speedup of 1.000000 x (3.099e-08 s -> 3.099e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.122634 s and estimated a speedup of 1.000000 x (5.335e-08 s -> 5.335e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.019579 0.016224 0.035803 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.035803 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.019579 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.016224 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.003712 0.001995 0.005707 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.005707 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.003712 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001995 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.035803 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.005707 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4279,50 +4315,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.054956 1e+09 1e+09 +%operation:A.mtx 0.00883317 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.0195789 0 0.0162239 +%constructor:A.mtx 0 0.00371194 0 0.00199509 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.056s): (3 x 3)[0xaaab0761de50]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.013s): (3 x 3)[0xaaab17411ed0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.02397s; avg 0.007989s ( +/- 0.28/ 0.15 %); best 0.007967s; worst 0.008001s; std dev. 1.58e-05 (taking best). -Reference operation time is 0.007967 s (0.01205 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.007967 Mflops: 0.012) -Merge (3 -> 1 leaves) took w.c.t. of 1.502e-05s, ~3.815e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 97.71/200.00 %); best 3.099e-08s; worst 4.053e-06s; std dev. 1.911e-06 (taking best). -Reference operation time is 3.09944e-08 s (3097 Mflops) with 12 threads. -After merge step 1: tpop: 3.099e-08 s ~Mflops: 3097.332 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 257046.154x: 0.007967s -> 3.099e-08s, so taking this instance. +3 iterations (12 th.) took 0.004898s; avg 0.001633s ( +/- 48.19/ 35.97 %); best 0.0008459s; worst 0.00222s; std dev. 0.0005784 (taking best). +Reference operation time is 0.000845909 s (0.1135 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0008459 Mflops: 0.113) +Merge (3 -> 1 leaves) took w.c.t. of 1.001e-05s, ~3.099e-06s of computing time (of which 1.192e-06s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 91.61/200.00 %); best 5.335e-08s; worst 1.907e-06s; std dev. 8.991e-07 (taking best). +Reference operation time is 5.33462e-08 s (1800 Mflops) with 12 threads. +After merge step 1: tpop: 5.335e-08 s ~Mflops: 1799.567 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 15856.983x: 0.0008459s -> 5.335e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.024s (of which 1.812e-05s partitioning, 0s I/O); computing times: 3.815e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.024s, equivalent to 774300.0/3.0 new/old ops (0.04795s for 2 clones -- as 1547084.6/6.0 ops, or 773542.3/3.0 ops per clone), SPEEDUP of 257046.154x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 257046.154x (0.007967s -> 3.099e-08s), will amortize in 3.0 ops by saving 0.007967s per op. -In 1 tuning rounds (tot. 0.072s, 0.048s for constructor, 2 clones) obtained a SPEEDUP of 25704515.4% (2.57e+05x) (from 0.01205 to 3097 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003023s (of which 1.311e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 1.192e-06s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.003023s, equivalent to 56665.9/3.6 new/old ops (0.007373s for 2 clones -- as 138207.8/8.7 ops, or 69103.9/4.4 ops per clone), SPEEDUP of 15856.983x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 15856.983x (0.0008459s -> 5.335e-08s), will amortize in 3.6 ops by saving 0.0008459s per op. +In 1 tuning rounds (tot. 0.012s, 0.0074s for constructor, 2 clones) obtained a SPEEDUP of 1585598.3% (1.586e+04x) (from 0.1135 to 1800 Mflops). #pr: updating sample at index 9 (1^th of 16), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.072006 s (7.967e-03 s -> 3.099e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0123439 s (8.459e-04 s -> 5.335e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.396211 s and estimated a speedup of 1.000000 x (3.099e-08 s -> 3.099e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0972469 s and estimated a speedup of 1.000000 x (5.335e-08 s -> 5.335e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.023602 0.016000 0.039602 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.039602 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.023602 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.016000 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.006216 0.002217 0.008433 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.008433 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.006216 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.002217 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.039602 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.008433 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4337,59 +4373,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.0556099 1e+09 1e+09 +%operation:A.mtx 0.0133169 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.023602 0 0.016 +%constructor:A.mtx 0 0.00621581 0 0.00221682 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 6.007s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.940s/0.000s . +# so far, program took 5.757s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.271s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.02935s (system CPU time used) -ru_utime : 3.346s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.04844s (system CPU time used) +ru_utime : 6.149s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 6.007s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.940s/0.000s . +# so far, program took 5.757s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.271s/0.000s . # Reusing type converted (D->S) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.055s): (3 x 3)[0xaaab0761de50]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.005s): (3 x 3)[0xaaab17411ed0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.028s; avg 0.009332s ( +/- 14.34/ 28.59 %); best 0.007994s; worst 0.012s; std dev. 0.001887 (taking best). -Reference operation time is 0.00799394 s (0.003002 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.007994 Mflops: 0.003) -Merge (3 -> 1 leaves) took w.c.t. of 1.502e-05s, ~4.053e-06s of computing time (of which 1.192e-06s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 5.96e-06s; avg 1.987e-06s ( +/- 98.44/152.00 %); best 3.099e-08s; worst 5.007e-06s; std dev. 2.171e-06 (taking best). -Reference operation time is 3.09944e-08 s (774.3 Mflops) with 12 threads. -After merge step 1: tpop: 3.099e-08 s ~Mflops: 774.333 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 257915.385x: 0.007994s -> 3.099e-08s, so taking this instance. +3 iterations (12 th.) took 0.003011s; avg 0.001004s ( +/- 14.53/ 7.42 %); best 0.0008578s; worst 0.001078s; std dev. 0.0001031 (taking best). +Reference operation time is 0.00085783 s (0.02798 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0008578 Mflops: 0.028) +Merge (3 -> 1 leaves) took w.c.t. of 1.097e-05s, ~4.053e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 96.80/142.86 %); best 5.335e-08s; worst 4.053e-06s; std dev. 1.73e-06 (taking best). +Reference operation time is 5.33462e-08 s (449.9 Mflops) with 12 threads. +After merge step 1: tpop: 5.335e-08 s ~Mflops: 449.892 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 16080.447x: 0.0008578s -> 5.335e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02185s (of which 1.717e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 1.192e-06s sorting, 2.861e-06s analyzing) -Total merge + benchmarking process took 0.02185s, equivalent to 704969.2/2.7 new/old ops (0.04557s for 2 clones -- as 1470176.9/5.7 ops, or 735088.5/2.9 ops per clone), SPEEDUP of 257915.385x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 257915.385x (0.007994s -> 3.099e-08s), will amortize in 2.7 ops by saving 0.007994s per op. -In 1 tuning rounds (tot. 0.074s, 0.046s for constructor, 2 clones) obtained a SPEEDUP of 25791438.5% (2.579e+05x) (from 0.003002 to 774.3 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002776s (of which 1.383e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 0s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.002776s, equivalent to 52035.8/3.2 new/old ops (0.004266s for 2 clones -- as 79964.2/5.0 ops, or 39982.1/2.5 ops per clone), SPEEDUP of 16080.447x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 16080.447x (0.0008578s -> 5.335e-08s), will amortize in 3.2 ops by saving 0.0008578s per op. +In 1 tuning rounds (tot. 0.0075s, 0.0043s for constructor, 2 clones) obtained a SPEEDUP of 1607944.7% (1.608e+04x) (from 0.02798 to 449.9 Mflops). #pr: updating sample at index 3 (2^th of 16), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.0737381 s (7.994e-03 s -> 3.099e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00750017 s (8.578e-04 s -> 5.335e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.358445 s and estimated a speedup of 1.000000 x (3.099e-08 s -> 3.099e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0390909 s and estimated a speedup of 1.000000 x (5.335e-08 s -> 5.335e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.023373 0.015996 0.039369 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.039369 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.023373 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.015996 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001984 0.001522 0.003506 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003506 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001984 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001522 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.039369 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003506 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4404,56 +4440,56 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.055377 1e+09 1e+09 +%operation:A.mtx 0.00469208 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.0233731 0 0.015996 +%constructor:A.mtx 0 0.00198412 0 0.00152206 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.056s): (3 x 3)[0xaaab0761de50]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.006s): (3 x 3)[0xaaab17411ed0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.02754s; avg 0.00918s ( +/- 15.16/ 27.97 %); best 0.007788s; worst 0.01175s; std dev. 0.001818 (taking best). -Reference operation time is 0.00778794 s (0.01233 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.007788 Mflops: 0.012) -Merge (3 -> 1 leaves) took w.c.t. of 1.717e-05s, ~5.007e-06s of computing time (of which 1.192e-06s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 98.14/142.86 %); best 3.099e-08s; worst 4.053e-06s; std dev. 1.73e-06 (taking best). -Reference operation time is 3.09944e-08 s (3097 Mflops) with 12 threads. -After merge step 1: tpop: 3.099e-08 s ~Mflops: 3097.332 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 251269.231x: 0.007788s -> 3.099e-08s, so taking this instance. +3 iterations (12 th.) took 0.00236s; avg 0.0007866s ( +/- 45.08/ 45.67 %); best 0.000432s; worst 0.001146s; std dev. 0.0002914 (taking best). +Reference operation time is 0.000432014 s (0.2222 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000432 Mflops: 0.222) +Merge (3 -> 1 leaves) took w.c.t. of 1.717e-05s, ~5.96e-06s of computing time (of which 1.907e-06s sorting, 3.815e-06s analysis) +3 iterations (12 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 94.84/200.00 %); best 5.335e-08s; worst 3.099e-06s; std dev. 1.461e-06 (taking best). +Reference operation time is 5.33462e-08 s (1800 Mflops) with 12 threads. +After merge step 1: tpop: 5.335e-08 s ~Mflops: 1799.567 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 8098.324x: 0.000432s -> 5.335e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02451s (of which 2.003e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 1.192e-06s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.02451s, equivalent to 790853.8/3.1 new/old ops (0.04887s for 2 clones -- as 1576738.5/6.3 ops, or 788369.2/3.1 ops per clone), SPEEDUP of 251269.231x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 251269.231x (0.007788s -> 3.099e-08s), will amortize in 3.1 ops by saving 0.007788s per op. -In 1 tuning rounds (tot. 0.077s, 0.049s for constructor, 2 clones) obtained a SPEEDUP of 25126823.1% (2.513e+05x) (from 0.01233 to 3097 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002849s (of which 1.907e-05s partitioning, 0s I/O); computing times: 5.96e-06s in par. loops, 1.907e-06s sorting, 3.815e-06s analyzing) +Total merge + benchmarking process took 0.002849s, equivalent to 53407.8/6.6 new/old ops (0.007372s for 2 clones -- as 138189.9/17.1 ops, or 69095.0/8.5 ops per clone), SPEEDUP of 8098.324x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 8098.324x (0.000432s -> 5.335e-08s), will amortize in 6.6 ops by saving 0.000432s per op. +In 1 tuning rounds (tot. 0.0098s, 0.0074s for constructor, 2 clones) obtained a SPEEDUP of 809732.4% (8098x) (from 0.2222 to 1800 Mflops). #pr: updating sample at index 11 (3^th of 16), 0^th touch for (0,0,0,0,1,1,0). -First run of RSB Autotuner took 0.076524 s (7.788e-03 s -> 3.099e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00985289 s (4.320e-04 s -> 5.335e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.351898 s and estimated a speedup of 1.000000 x (3.099e-08 s -> 3.099e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0452878 s and estimated a speedup of 1.000000 x (5.335e-08 s -> 5.335e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000001 0.023623 0.015990 0.039613 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.039614 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.023623 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.015990 -%:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000001 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 1.000 -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.039613 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.002945 0.001470 0.004415 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004415 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002945 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001470 +%:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004415 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:RSB_SUBDIVISION_SCALING:A.mtx S N 12 3 3 6 1.00 %:RSB_SHUFFLE_SCALING:A.mtx S N 12 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 12 3 3 6 1.00 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:A.mtx S N 12 3 3 6 nan 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 12 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 12 3 3 6 28 48 36 @@ -4462,59 +4498,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.0556202 1e+09 1e+09 +%operation:A.mtx 0.00613308 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 9.53674e-07 0.023623 0 0.01599 +%constructor:A.mtx 0 0.00294495 0 0.00147009 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 7.058s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.801s/0.000s . +# so far, program took 5.881s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.372s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.03994s (system CPU time used) -ru_utime : 3.908s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.05249s (system CPU time used) +ru_utime : 6.674s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was S). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 7.058s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.801s/0.000s . +# so far, program took 5.881s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.372s/0.000s . # Reusing type converted (S->C) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.048s): (3 x 3)[0xaaab07621260]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.006s): (3 x 3)[0xaaab17415280]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.02376s; avg 0.007921s ( +/- 1.99/ 1.61 %); best 0.007763s; worst 0.008048s; std dev. 0.0001184 (taking best). -Reference operation time is 0.00776291 s (0.01237 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.007763 Mflops: 0.012) -Merge (3 -> 1 leaves) took w.c.t. of 1.287e-05s, ~4.053e-06s of computing time (of which 0s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 0.0001011s; avg 3.37e-05s ( +/- 99.91/197.17 %); best 3.099e-08s; worst 0.0001001s; std dev. 4.698e-05 (taking best). -Reference operation time is 3.09944e-08 s (3097 Mflops) with 12 threads. -After merge step 1: tpop: 3.099e-08 s ~Mflops: 3097.332 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 250461.538x: 0.007763s -> 3.099e-08s, so taking this instance. +3 iterations (12 th.) took 0.002572s; avg 0.0008574s ( +/- 19.74/ 20.49 %); best 0.0006881s; worst 0.001033s; std dev. 0.0001409 (taking best). +Reference operation time is 0.000688076 s (0.1395 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0006881 Mflops: 0.140) +Merge (3 -> 1 leaves) took w.c.t. of 1.812e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 0.0001259s; avg 4.196e-05s ( +/- 99.87/200.00 %); best 5.335e-08s; worst 0.0001259s; std dev. 5.934e-05 (taking best). +Reference operation time is 5.33462e-08 s (1800 Mflops) with 12 threads. +After merge step 1: tpop: 5.335e-08 s ~Mflops: 1799.567 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 12898.324x: 0.0006881s -> 5.335e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.0242s (of which 1.502e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 0s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.0242s, equivalent to 780684.6/3.1 new/old ops (0.04814s for 2 clones -- as 1553246.2/6.2 ops, or 776623.1/3.1 ops per clone), SPEEDUP of 250461.538x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 250461.538x (0.007763s -> 3.099e-08s), will amortize in 3.1 ops by saving 0.007763s per op. -In 1 tuning rounds (tot. 0.072s, 0.048s for constructor, 2 clones) obtained a SPEEDUP of 25046053.8% (2.505e+05x) (from 0.01237 to 3097 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00243s (of which 2.098e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 9.537e-07s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.00243s, equivalent to 45550.8/3.5 new/old ops (0.004611s for 2 clones -- as 86435.8/6.7 ops, or 43217.9/3.4 ops per clone), SPEEDUP of 12898.324x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 12898.324x (0.0006881s -> 5.335e-08s), will amortize in 3.5 ops by saving 0.000688s per op. +In 1 tuning rounds (tot. 0.0074s, 0.0046s for constructor, 2 clones) obtained a SPEEDUP of 1289732.4% (1.29e+04x) (from 0.1395 to 1800 Mflops). #pr: updating sample at index 5 (4^th of 16), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.0720851 s (7.763e-03 s -> 3.099e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00738502 s (6.881e-04 s -> 5.335e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.399996 s and estimated a speedup of 1.000000 x (3.099e-08 s -> 3.099e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0921991 s and estimated a speedup of 1.000000 x (5.335e-08 s -> 5.335e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.015950 0.015977 0.031927 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.031927 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.015950 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.015977 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.002236 0.001886 0.004122 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004122 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002236 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001886 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.031927 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004122 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4529,50 +4565,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.0479598 1e+09 1e+09 +%operation:A.mtx 0.00607491 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.01595 0 0.0159771 +%constructor:A.mtx 0 0.00223589 0 0.00188613 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.056s): (3 x 3)[0xaaab07621260]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.004s): (3 x 3)[0xaaab17415280]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.02044s; avg 0.006813s ( +/- 34.74/ 20.25 %); best 0.004446s; worst 0.008193s; std dev. 0.001681 (taking best). -Reference operation time is 0.00444603 s (0.08637 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.004446 Mflops: 0.086) -Merge (3 -> 1 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 1.192e-06s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 96.75/200.00 %); best 3.099e-08s; worst 2.861e-06s; std dev. 1.349e-06 (taking best). -Reference operation time is 3.09944e-08 s (1.239e+04 Mflops) with 12 threads. -After merge step 1: tpop: 3.099e-08 s ~Mflops: 12389.329 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 143446.154x: 0.004446s -> 3.099e-08s, so taking this instance. +3 iterations (12 th.) took 0.005844s; avg 0.001948s ( +/- 23.78/ 19.66 %); best 0.001485s; worst 0.002331s; std dev. 0.0003501 (taking best). +Reference operation time is 0.00148487 s (0.2586 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001485 Mflops: 0.259) +Merge (3 -> 1 leaves) took w.c.t. of 1.693e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) +3 iterations (12 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 96.05/200.00 %); best 5.335e-08s; worst 4.053e-06s; std dev. 1.911e-06 (taking best). +Reference operation time is 5.33462e-08 s (7198 Mflops) with 12 threads. +After merge step 1: tpop: 5.335e-08 s ~Mflops: 7198.269 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 27834.637x: 0.001485s -> 5.335e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.0238s (of which 1.287e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 1.192e-06s sorting, 2.861e-06s analyzing) -Total merge + benchmarking process took 0.0238s, equivalent to 767976.9/5.4 new/old ops (0.04732s for 2 clones -- as 1526792.3/10.6 ops, or 763396.2/5.3 ops per clone), SPEEDUP of 143446.154x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 143446.154x (0.004446s -> 3.099e-08s), will amortize in 5.4 ops by saving 0.004446s per op. -In 1 tuning rounds (tot. 0.068s, 0.047s for constructor, 2 clones) obtained a SPEEDUP of 14344515.4% (1.434e+05x) (from 0.08637 to 1.239e+04 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003251s (of which 1.907e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.003251s, equivalent to 60943.0/2.2 new/old ops (0.01239s for 2 clones -- as 232219.0/8.3 ops, or 116109.5/4.2 ops per clone), SPEEDUP of 27834.637x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 27834.637x (0.001485s -> 5.335e-08s), will amortize in 2.2 ops by saving 0.001485s per op. +In 1 tuning rounds (tot. 0.018s, 0.012s for constructor, 2 clones) obtained a SPEEDUP of 2783363.7% (2.783e+04x) (from 0.2586 to 7198 Mflops). #pr: updating sample at index 13 (5^th of 16), 0^th touch for (0,0,0,0,1,2,0). -First run of RSB Autotuner took 0.0678399 s (4.446e-03 s -> 3.099e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0183501 s (1.485e-03 s -> 5.335e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.423942 s and estimated a speedup of 1.000000 x (3.099e-08 s -> 3.099e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0609329 s and estimated a speedup of 1.000000 x (5.335e-08 s -> 5.335e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.023372 0.016211 0.039583 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.039583 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.023372 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.016211 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001089 0.001558 0.002647 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002647 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001089 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001558 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.039583 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002647 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4587,59 +4623,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.0555818 1e+09 1e+09 +%operation:A.mtx 0.00357103 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.0233719 0 0.016211 +%constructor:A.mtx 0 0.0010891 0 0.00155783 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 8.203s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 2.765s/0.000s . +# so far, program took 6.080s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.551s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.05247s (system CPU time used) -ru_utime : 4.519s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.06469s (system CPU time used) +ru_utime : 7.255s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was C). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 8.203s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 2.765s/0.000s . +# so far, program took 6.080s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.551s/0.000s . # Reusing type converted (C->Z) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.052s): (3 x 3)[0xaaab07621260]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.006s): (3 x 3)[0xaaab17415280]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.02344s; avg 0.007813s ( +/- 2.04/ 2.15 %); best 0.007653s; worst 0.007981s; std dev. 0.0001341 (taking best). -Reference operation time is 0.007653 s (0.01254 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.007653 Mflops: 0.013) -Merge (3 -> 1 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 0s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 1.597e-05s; avg 5.325e-06s ( +/- 99.42/200.00 %); best 3.099e-08s; worst 1.597e-05s; std dev. 7.53e-06 (taking best). -Reference operation time is 3.09944e-08 s (3097 Mflops) with 12 threads. -After merge step 1: tpop: 3.099e-08 s ~Mflops: 3097.332 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 246915.385x: 0.007653s -> 3.099e-08s, so taking this instance. +3 iterations (12 th.) took 0.002941s; avg 0.0009804s ( +/- 35.94/ 30.76 %); best 0.000628s; worst 0.001282s; std dev. 0.0002694 (taking best). +Reference operation time is 0.000627995 s (0.1529 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000628 Mflops: 0.153) +Merge (3 -> 1 leaves) took w.c.t. of 9.06e-06s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 1.192e-05s; avg 3.974e-06s ( +/- 98.66/200.00 %); best 5.335e-08s; worst 1.192e-05s; std dev. 5.62e-06 (taking best). +Reference operation time is 5.33462e-08 s (1800 Mflops) with 12 threads. +After merge step 1: tpop: 5.335e-08 s ~Mflops: 1799.567 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 11772.067x: 0.000628s -> 5.335e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02465s (of which 1.407e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 0s sorting, 2.861e-06s analyzing) -Total merge + benchmarking process took 0.02465s, equivalent to 795461.5/3.2 new/old ops (0.04879s for 2 clones -- as 1574092.3/6.4 ops, or 787046.2/3.2 ops per clone), SPEEDUP of 246915.385x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 246915.385x (0.007653s -> 3.099e-08s), will amortize in 3.2 ops by saving 0.007653s per op. -In 1 tuning rounds (tot. 0.072s, 0.049s for constructor, 2 clones) obtained a SPEEDUP of 24691438.5% (2.469e+05x) (from 0.01254 to 3097 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002575s (of which 1.097e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.002575s, equivalent to 48272.6/4.1 new/old ops (0.005399s for 2 clones -- as 101206.7/8.6 ops, or 50603.4/4.3 ops per clone), SPEEDUP of 11772.067x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 11772.067x (0.000628s -> 5.335e-08s), will amortize in 4.1 ops by saving 0.0006279s per op. +In 1 tuning rounds (tot. 0.0084s, 0.0054s for constructor, 2 clones) obtained a SPEEDUP of 1177106.7% (1.177e+04x) (from 0.1529 to 1800 Mflops). #pr: updating sample at index 7 (6^th of 16), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.0723171 s (7.653e-03 s -> 3.099e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00841498 s (6.280e-04 s -> 5.335e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.407017 s and estimated a speedup of 1.000000 x (3.099e-08 s -> 3.099e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.042639 s and estimated a speedup of 1.000000 x (5.335e-08 s -> 5.335e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.019545 0.015997 0.035542 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.035542 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.019545 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.015997 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.002646 0.001909 0.004555 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004555 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002646 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001909 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.035542 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004555 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4654,50 +4690,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.0515501 1e+09 1e+09 +%operation:A.mtx 0.00641418 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.0195448 0 0.0159969 +%constructor:A.mtx 0 0.00264597 0 0.00190902 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.052s): (3 x 3)[0xaaab07621260]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.006s): (3 x 3)[0xaaab17415280]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.024s; avg 0.008s ( +/- 0.02/ 0.03 %); best 0.007998s; worst 0.008002s; std dev. 1.73e-06 (taking best). -Reference operation time is 0.00799799 s (0.04801 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.007998 Mflops: 0.048) -Merge (3 -> 1 leaves) took w.c.t. of 1.502e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 98.14/142.86 %); best 3.099e-08s; worst 4.053e-06s; std dev. 1.73e-06 (taking best). -Reference operation time is 3.09944e-08 s (1.239e+04 Mflops) with 12 threads. -After merge step 1: tpop: 3.099e-08 s ~Mflops: 12389.329 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 258046.154x: 0.007998s -> 3.099e-08s, so taking this instance. +3 iterations (12 th.) took 0.002732s; avg 0.0009107s ( +/- 29.84/ 16.29 %); best 0.000639s; worst 0.001059s; std dev. 0.0001924 (taking best). +Reference operation time is 0.000638962 s (0.601 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000639 Mflops: 0.601) +Merge (3 -> 1 leaves) took w.c.t. of 1.001e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 3.815e-06s; avg 1.272e-06s ( +/- 95.80/200.00 %); best 5.335e-08s; worst 3.815e-06s; std dev. 1.798e-06 (taking best). +Reference operation time is 5.33462e-08 s (7198 Mflops) with 12 threads. +After merge step 1: tpop: 5.335e-08 s ~Mflops: 7198.269 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 11977.654x: 0.000639s -> 5.335e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02399s (of which 1.717e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.02399s, equivalent to 773946.2/3.0 new/old ops (0.04792s for 2 clones -- as 1546015.4/6.0 ops, or 773007.7/3.0 ops per clone), SPEEDUP of 258046.154x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 258046.154x (0.007998s -> 3.099e-08s), will amortize in 3.0 ops by saving 0.007998s per op. -In 1 tuning rounds (tot. 0.072s, 0.048s for constructor, 2 clones) obtained a SPEEDUP of 25804515.4% (2.58e+05x) (from 0.04801 to 1.239e+04 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002327s (of which 1.287e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) +Total merge + benchmarking process took 0.002327s, equivalent to 43620.1/3.6 new/old ops (0.005768s for 2 clones -- as 108120.7/9.0 ops, or 54060.3/4.5 ops per clone), SPEEDUP of 11977.654x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 11977.654x (0.000639s -> 5.335e-08s), will amortize in 3.6 ops by saving 0.0006389s per op. +In 1 tuning rounds (tot. 0.0087s, 0.0058s for constructor, 2 clones) obtained a SPEEDUP of 1197665.4% (1.198e+04x) (from 0.601 to 7198 Mflops). #pr: updating sample at index 15 (7^th of 16), 0^th touch for (0,0,0,0,1,3,0). -First run of RSB Autotuner took 0.072181 s (7.998e-03 s -> 3.099e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00875807 s (6.390e-04 s -> 5.335e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.403807 s and estimated a speedup of 1.000000 x (3.099e-08 s -> 3.099e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0533531 s and estimated a speedup of 1.000000 x (5.335e-08 s -> 5.335e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.019942 0.016011 0.035953 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.035953 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.019942 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.016011 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001980 0.001691 0.003671 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003671 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001980 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001691 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.035953 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003671 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4712,332 +4748,332 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.0519462 1e+09 1e+09 +%operation:A.mtx 0.00647497 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.019942 0 0.016011 +%constructor:A.mtx 0 0.00197983 0 0.0016911 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 9.342s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 3.720s/0.000s . +# so far, program took 6.216s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.664s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.06s (system CPU time used) -ru_utime : 5.167s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.06902s (system CPU time used) +ru_utime : 7.788s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to type D: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 774.33 7.768e-03 0.000e+00 3.099e-08 0.000e+00 7.220e-02 4.78e+00 5.17e+00 1 2.40e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.967e-03 0.000e+00 3.099e-08 0.000e+00 7.201e-02 1.17e+01 2.79e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 449.89 4.518e-03 0.000e+00 5.335e-08 0.000e+00 3.842e-02 2.77e+00 5.17e+00 1 2.40e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1799.57 8.459e-04 0.000e+00 5.335e-08 0.000e+00 1.234e-02 6.82e+00 2.79e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 25383746.2 % faster, avg. sp. ratio 253838.462x, max sp. ratio 257046.154x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2326353.8/2323192.3/2329515.4/4652707.7 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.2/ 9.0/ 9.3/ 18.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.2, min. 9.0, max. 9.3 ops) +#pr: (in succ. cases rsb autotuning gave avg. 5027386.0 % faster, avg. sp. ratio 50274.860x, max sp. ratio 84692.737x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 475834.6/231392.2/720277.1/951669.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.5/ 8.5/ 14.6/ 23.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 11.5, min. 8.5, max. 14.6 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 6.324/ 4.001/ 8.647,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.519/ 4.775/ 11.744,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.674/ 2.324/ 5.024,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.598/ 2.774/ 6.823,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 3.979/ 2.792/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.936e+03, min 7.743e+02, max 3.097e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.570e-03, min 3.090e-03, max 1.205e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 6.199e-08s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.868e-03s, min 7.768e-03s, max 7.967e-03s, tot 1.574e-02s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 3.496e+00 7.557e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.01 s, max 0.04 s, tot 0.05 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.01 s, max 0.04 s, tot 0.05 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.125e+03, min 4.499e+02, max 1.800e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 5.940e-02, min 5.312e-03, max 1.135e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 1.067e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.682e-03s, min 8.459e-04s, max 4.518e-03s, tot 5.364e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.138e+00 1.975e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type S: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 774.33 7.994e-03 0.000e+00 3.099e-08 0.000e+00 7.374e-02 2.84e+00 3.17e+00 1 2.40e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.788e-03 0.000e+00 3.099e-08 0.000e+00 7.652e-02 6.32e+00 1.54e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 449.89 8.578e-04 0.000e+00 5.335e-08 0.000e+00 7.500e-03 1.65e+00 3.17e+00 1 2.40e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1799.57 4.320e-04 0.000e+00 5.335e-08 0.000e+00 9.853e-03 3.67e+00 1.54e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 25459130.8 % faster, avg. sp. ratio 254592.308x, max sp. ratio 257915.385x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2424019.2/2379076.9/2468961.5/4848038.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.5/ 9.2/ 9.8/ 19.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.5, min. 9.2, max. 9.8 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1208838.5 % faster, avg. sp. ratio 12089.385x, max sp. ratio 16080.447x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 162645.8/140594.4/184697.2/325291.6 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.8/ 8.7/ 22.8/ 31.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.8, min. 8.7, max. 22.8 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 8/ 8/ 8) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 24/ 24/ 24) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.614/ 2.452/ 4.775,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.163/ 2.839/ 6.324,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.099/ 1.425/ 2.774,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 5.324/ 1.650/ 3.674,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.354/ 1.542/ 3.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.08 s, min 0.07 s, max 0.08 s, tot 0.15 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.08 s, min 0.07 s, max 0.08 s, tot 0.15 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.936e+03, min 7.743e+02, max 3.097e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.665e-03, min 3.002e-03, max 1.233e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 6.199e-08s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.891e-03s, min 7.788e-03s, max 7.994e-03s, tot 1.578e-02s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 6.331e+00 1.233e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.125e+03, min 4.499e+02, max 1.800e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.251e-01, min 2.798e-02, max 2.222e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 1.067e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.449e-04s, min 4.320e-04s, max 8.578e-04s, tot 1.290e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.655e+01 3.222e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type C: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.763e-03 0.000e+00 3.099e-08 0.000e+00 7.209e-02 4.78e+00 1.29e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 12389.33 4.446e-03 0.000e+00 3.099e-08 0.000e+00 6.784e-02 1.17e+01 6.98e-01 1 3.84e-04 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.881e-04 0.000e+00 5.335e-08 0.000e+00 7.385e-03 2.77e+00 1.29e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 7198.27 1.485e-03 0.000e+00 5.335e-08 0.000e+00 1.835e-02 6.82e+00 6.98e-01 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 19695284.6 % faster, avg. sp. ratio 196953.846x, max sp. ratio 250461.538x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2257261.5/2188776.9/2325746.2/4514523.1 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 12.3/ 9.3/ 15.3/ 24.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 12.3, min. 9.3, max. 15.3 ops) +#pr: (in succ. cases rsb autotuning gave avg. 2036548.0 % faster, avg. sp. ratio 20366.480x, max sp. ratio 27834.637x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 241208.9/138435.8/343982.1/482417.9 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.5/ 10.7/ 12.4/ 23.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 11.5, min. 10.7, max. 12.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 6.324/ 4.001/ 8.647,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.519/ 4.775/ 11.744,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.674/ 2.324/ 5.024,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.598/ 2.774/ 6.823,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 0.995/ 0.698/ 1.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.743e+03, min 3.097e+03, max 1.239e+04 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 4.937e-02, min 1.237e-02, max 8.637e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 6.199e-08s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.104e-03s, min 4.446e-03s, max 7.763e-03s, tot 1.221e-02s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 3.496e+00 7.557e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.499e+03, min 1.800e+03, max 7.198e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.991e-01, min 1.395e-01, max 2.586e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 1.067e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.086e-03s, min 6.881e-04s, max 1.485e-03s, tot 2.173e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.138e+00 1.975e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type Z: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.653e-03 0.000e+00 3.099e-08 0.000e+00 7.232e-02 8.65e+00 2.29e+00 1 9.60e-05 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 12389.33 7.998e-03 0.000e+00 3.099e-08 0.000e+00 7.218e-02 2.26e+01 1.32e+00 1 3.84e-04 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.280e-04 0.000e+00 5.335e-08 0.000e+00 8.415e-03 5.02e+00 2.29e+00 1 9.60e-05 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 7198.27 6.390e-04 0.000e+00 5.335e-08 0.000e+00 8.758e-03 1.31e+01 1.32e+00 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 25247976.9 % faster, avg. sp. ratio 252480.769x, max sp. ratio 258046.154x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2331034.6/2328838.5/2333230.8/4662069.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.2/ 9.0/ 9.4/ 18.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.2, min. 9.0, max. 9.4 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1187386.0 % faster, avg. sp. ratio 11874.860x, max sp. ratio 11977.654x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 160958.7/157743.0/164174.3/321917.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.6/ 13.4/ 13.7/ 27.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.6, min. 13.4, max. 13.7 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 11.744/ 7.098/ 16.390,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 31.231/ 8.647/ 22.585,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 6.823/ 4.124/ 9.523,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 18.146/ 5.024/ 13.122,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.807/ 1.323/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.14 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.743e+03, min 3.097e+03, max 1.239e+04 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.028e-02, min 1.254e-02, max 4.801e-02 (2 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 6.199e-08s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.825e-03s, min 7.653e-03s, max 7.998e-03s, tot 1.565e-02s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.845e+00 4.259e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.499e+03, min 1.800e+03, max 7.198e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.769e-01, min 1.529e-01, max 6.010e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 1.067e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.335e-04s, min 6.280e-04s, max 6.390e-04s, tot 1.267e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.821e+00 1.113e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 774.33 7.768e-03 0.000e+00 3.099e-08 0.000e+00 7.220e-02 4.78e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 774.33 7.994e-03 0.000e+00 3.099e-08 0.000e+00 7.374e-02 2.84e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.763e-03 0.000e+00 3.099e-08 0.000e+00 7.209e-02 4.78e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.653e-03 0.000e+00 3.099e-08 0.000e+00 7.232e-02 8.65e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 449.89 4.518e-03 0.000e+00 5.335e-08 0.000e+00 3.842e-02 2.77e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 449.89 8.578e-04 0.000e+00 5.335e-08 0.000e+00 7.500e-03 1.65e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.881e-04 0.000e+00 5.335e-08 0.000e+00 7.385e-03 2.77e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.280e-04 0.000e+00 5.335e-08 0.000e+00 8.415e-03 5.02e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 25147976.9 % faster, avg. sp. ratio 251480.769x, max sp. ratio 257915.385x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2341892.3/2325746.2/2379076.9/9367569.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.3/ 9.2/ 9.4/ 37.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.3, min. 9.2, max. 9.4 ops) +#pr: (in succ. cases rsb autotuning gave avg. 3135989.4 % faster, avg. sp. ratio 31360.894x, max sp. ratio 84692.737x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 289262.6/138435.8/720277.1/1157050.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.3/ 8.5/ 13.4/ 41.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 10.3, min. 8.5, max. 13.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.388/ 2.452/ 7.098,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 21.036/ 2.839/ 8.647,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.549/ 1.425/ 4.124,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.222/ 1.650/ 5.024,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.29 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.29 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.936e+03, min 7.743e+02, max 3.097e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.751e-03, min 3.002e-03, max 1.254e-02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 1.240e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.794e-03s, min 7.653e-03s, max 7.994e-03s, tot 3.118e-02s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.259e+00 1.233e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.06 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.06 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.125e+03, min 4.499e+02, max 1.800e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.142e-02, min 5.312e-03, max 1.529e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 2.134e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.673e-03s, min 6.280e-04s, max 4.518e-03s, tot 6.692e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.113e+01 3.222e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: ======== Limiting to nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.967e-03 0.000e+00 3.099e-08 0.000e+00 7.201e-02 1.17e+01 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.788e-03 0.000e+00 3.099e-08 0.000e+00 7.652e-02 6.32e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 12389.33 4.446e-03 0.000e+00 3.099e-08 0.000e+00 6.784e-02 1.17e+01 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 12389.33 7.998e-03 0.000e+00 3.099e-08 0.000e+00 7.218e-02 2.26e+01 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1799.57 8.459e-04 0.000e+00 5.335e-08 0.000e+00 1.234e-02 6.82e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1799.57 4.320e-04 0.000e+00 5.335e-08 0.000e+00 9.853e-03 3.67e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 7198.27 1.485e-03 0.000e+00 5.335e-08 0.000e+00 1.835e-02 6.82e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 7198.27 6.390e-04 0.000e+00 5.335e-08 0.000e+00 8.758e-03 1.31e+01 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 22745092.3 % faster, avg. sp. ratio 227451.923x, max sp. ratio 258046.154x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2327442.3/2188776.9/2468961.5/9309769.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.8/ 9.0/ 15.3/ 43.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.8, min. 9.0, max. 15.3 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1594089.9 % faster, avg. sp. ratio 15941.899x, max sp. ratio 27834.637x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 231061.5/164174.3/343982.1/924245.8 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.9/ 12.4/ 22.8/ 63.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.9, min. 12.4, max. 22.8 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 9.615/ 4.775/ 16.390,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 52.397/ 6.324/ 22.585,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.586/ 2.774/ 9.523,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 30.443/ 3.674/ 13.122,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.29 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.29 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.743e+03, min 3.097e+03, max 1.239e+04 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.969e-02, min 1.205e-02, max 8.637e-02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 1.240e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.050e-03s, min 4.446e-03s, max 7.998e-03s, tot 2.820e-02s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.845e+00 6.331e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.499e+03, min 1.800e+03, max 7.198e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.988e-01, min 1.135e-01, max 6.010e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 2.134e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.504e-04s, min 4.320e-04s, max 1.485e-03s, tot 3.402e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.821e+00 1.655e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 774.33 7.768e-03 0.000e+00 3.099e-08 0.000e+00 7.220e-02 4.78e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 774.33 7.994e-03 0.000e+00 3.099e-08 0.000e+00 7.374e-02 2.84e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.763e-03 0.000e+00 3.099e-08 0.000e+00 7.209e-02 4.78e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.653e-03 0.000e+00 3.099e-08 0.000e+00 7.232e-02 8.65e+00 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.967e-03 0.000e+00 3.099e-08 0.000e+00 7.201e-02 1.17e+01 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.788e-03 0.000e+00 3.099e-08 0.000e+00 7.652e-02 6.32e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 12389.33 4.446e-03 0.000e+00 3.099e-08 0.000e+00 6.784e-02 1.17e+01 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 12389.33 7.998e-03 0.000e+00 3.099e-08 0.000e+00 7.218e-02 2.26e+01 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 449.89 4.518e-03 0.000e+00 5.335e-08 0.000e+00 3.842e-02 2.77e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 449.89 8.578e-04 0.000e+00 5.335e-08 0.000e+00 7.500e-03 1.65e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.881e-04 0.000e+00 5.335e-08 0.000e+00 7.385e-03 2.77e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.280e-04 0.000e+00 5.335e-08 0.000e+00 8.415e-03 5.02e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1799.57 8.459e-04 0.000e+00 5.335e-08 0.000e+00 1.234e-02 6.82e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1799.57 4.320e-04 0.000e+00 5.335e-08 0.000e+00 9.853e-03 3.67e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 7198.27 1.485e-03 0.000e+00 5.335e-08 0.000e+00 1.835e-02 6.82e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 7198.27 6.390e-04 0.000e+00 5.335e-08 0.000e+00 8.758e-03 1.31e+01 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 23946534.6 % faster, avg. sp. ratio 239466.346x, max sp. ratio 258046.154x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2334667.3/2188776.9/2468961.5/18677338.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.1/ 9.0/ 15.3/ 80.4 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.1, min. 9.0, max. 15.3 ops) +#pr: (in succ. cases rsb autotuning gave avg. 2365039.7 % faster, avg. sp. ratio 23651.397x, max sp. ratio 84692.737x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 260162.0/138435.8/720277.1/2081296.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.1/ 8.5/ 22.8/104.8 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.1, min. 8.5, max. 22.8 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 7.001/ 2.452/ 16.390,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 73.433/ 2.839/ 22.585,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.068/ 1.425/ 9.523,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 42.665/ 1.650/ 13.122,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /8 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.58 s (8 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.58 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 4.840e+03, min 7.743e+02, max 1.239e+04 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.372e-02, min 3.002e-03, max 8.637e-02 (8 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 2.480e-07s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.422e-03s, min 4.446e-03s, max 7.998e-03s, tot 5.938e-02s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.845e+00 1.233e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.04 s, tot 0.11 s (8 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.04 s, tot 0.11 s (8 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.812e+03, min 4.499e+02, max 7.198e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.901e-01, min 5.312e-03, max 6.010e-01 (8 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 4.268e-07s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.262e-03s, min 4.320e-04s, max 4.518e-03s, tot 1.009e-02s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.821e+00 3.222e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 774.33 7.768e-03 0.000e+00 3.099e-08 0.000e+00 7.220e-02 4.78e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 774.33 7.994e-03 0.000e+00 3.099e-08 0.000e+00 7.374e-02 2.84e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.763e-03 0.000e+00 3.099e-08 0.000e+00 7.209e-02 4.78e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.653e-03 0.000e+00 3.099e-08 0.000e+00 7.232e-02 8.65e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 449.89 4.518e-03 0.000e+00 5.335e-08 0.000e+00 3.842e-02 2.77e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 449.89 8.578e-04 0.000e+00 5.335e-08 0.000e+00 7.500e-03 1.65e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.881e-04 0.000e+00 5.335e-08 0.000e+00 7.385e-03 2.77e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.280e-04 0.000e+00 5.335e-08 0.000e+00 8.415e-03 5.02e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 25147976.9 % faster, avg. sp. ratio 251480.769x, max sp. ratio 257915.385x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2341892.3/2325746.2/2379076.9/9367569.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.3/ 9.2/ 9.4/ 37.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.3, min. 9.2, max. 9.4 ops) +#pr: (in succ. cases rsb autotuning gave avg. 3135989.4 % faster, avg. sp. ratio 31360.894x, max sp. ratio 84692.737x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 289262.6/138435.8/720277.1/1157050.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.3/ 8.5/ 13.4/ 41.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 10.3, min. 8.5, max. 13.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.388/ 2.452/ 7.098,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 21.036/ 2.839/ 8.647,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.549/ 1.425/ 4.124,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.222/ 1.650/ 5.024,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.29 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.07 s, tot 0.29 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.936e+03, min 7.743e+02, max 3.097e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.751e-03, min 3.002e-03, max 1.254e-02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 1.240e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.794e-03s, min 7.653e-03s, max 7.994e-03s, tot 3.118e-02s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.259e+00 1.233e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.06 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.04 s, tot 0.06 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.125e+03, min 4.499e+02, max 1.800e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.142e-02, min 5.312e-03, max 1.529e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 2.134e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.673e-03s, min 6.280e-04s, max 4.518e-03s, tot 6.692e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.113e+01 3.222e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: ======== Limiting to both transA=N and nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.967e-03 0.000e+00 3.099e-08 0.000e+00 7.201e-02 1.17e+01 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.788e-03 0.000e+00 3.099e-08 0.000e+00 7.652e-02 6.32e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 12389.33 4.446e-03 0.000e+00 3.099e-08 0.000e+00 6.784e-02 1.17e+01 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 12389.33 7.998e-03 0.000e+00 3.099e-08 0.000e+00 7.218e-02 2.26e+01 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1799.57 8.459e-04 0.000e+00 5.335e-08 0.000e+00 1.234e-02 6.82e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1799.57 4.320e-04 0.000e+00 5.335e-08 0.000e+00 9.853e-03 3.67e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 7198.27 1.485e-03 0.000e+00 5.335e-08 0.000e+00 1.835e-02 6.82e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 7198.27 6.390e-04 0.000e+00 5.335e-08 0.000e+00 8.758e-03 1.31e+01 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 22745092.3 % faster, avg. sp. ratio 227451.923x, max sp. ratio 258046.154x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2327442.3/2188776.9/2468961.5/9309769.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.8/ 9.0/ 15.3/ 43.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.8, min. 9.0, max. 15.3 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1594089.9 % faster, avg. sp. ratio 15941.899x, max sp. ratio 27834.637x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 231061.5/164174.3/343982.1/924245.8 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.9/ 12.4/ 22.8/ 63.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.9, min. 12.4, max. 22.8 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 9.615/ 4.775/ 16.390,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 52.397/ 6.324/ 22.585,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.586/ 2.774/ 9.523,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 30.443/ 3.674/ 13.122,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.29 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.29 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.743e+03, min 3.097e+03, max 1.239e+04 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.969e-02, min 1.205e-02, max 8.637e-02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 1.240e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.050e-03s, min 4.446e-03s, max 7.998e-03s, tot 2.820e-02s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.845e+00 6.331e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.499e+03, min 1.800e+03, max 7.198e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.988e-01, min 1.135e-01, max 6.010e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 2.134e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.504e-04s, min 4.320e-04s, max 1.485e-03s, tot 3.402e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.821e+00 1.655e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 8) matched the dump criteria -- skipping dump round. @@ -5048,65 +5084,65 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 774.33 7.768e-03 0.000e+00 3.099e-08 0.000e+00 7.220e-02 4.78e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 774.33 7.994e-03 0.000e+00 3.099e-08 0.000e+00 7.374e-02 2.84e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.763e-03 0.000e+00 3.099e-08 0.000e+00 7.209e-02 4.78e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.653e-03 0.000e+00 3.099e-08 0.000e+00 7.232e-02 8.65e+00 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.967e-03 0.000e+00 3.099e-08 0.000e+00 7.201e-02 1.17e+01 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 3097.33 7.788e-03 0.000e+00 3.099e-08 0.000e+00 7.652e-02 6.32e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 12389.33 4.446e-03 0.000e+00 3.099e-08 0.000e+00 6.784e-02 1.17e+01 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 12389.33 7.998e-03 0.000e+00 3.099e-08 0.000e+00 7.218e-02 2.26e+01 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 449.89 4.518e-03 0.000e+00 5.335e-08 0.000e+00 3.842e-02 2.77e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 449.89 8.578e-04 0.000e+00 5.335e-08 0.000e+00 7.500e-03 1.65e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.881e-04 0.000e+00 5.335e-08 0.000e+00 7.385e-03 2.77e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1799.57 6.280e-04 0.000e+00 5.335e-08 0.000e+00 8.415e-03 5.02e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1799.57 8.459e-04 0.000e+00 5.335e-08 0.000e+00 1.234e-02 6.82e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1799.57 4.320e-04 0.000e+00 5.335e-08 0.000e+00 9.853e-03 3.67e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 7198.27 1.485e-03 0.000e+00 5.335e-08 0.000e+00 1.835e-02 6.82e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 7198.27 6.390e-04 0.000e+00 5.335e-08 0.000e+00 8.758e-03 1.31e+01 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 23946534.6 % faster, avg. sp. ratio 239466.346x, max sp. ratio 258046.154x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2334667.3/2188776.9/2468961.5/18677338.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.1/ 9.0/ 15.3/ 80.4 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.1, min. 9.0, max. 15.3 ops) +#pr: (in succ. cases rsb autotuning gave avg. 2365039.7 % faster, avg. sp. ratio 23651.397x, max sp. ratio 84692.737x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 260162.0/138435.8/720277.1/2081296.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.1/ 8.5/ 22.8/104.8 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.1, min. 8.5, max. 22.8 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 7.001/ 2.452/ 16.390,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 73.433/ 2.839/ 22.585,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.068/ 1.425/ 9.523,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 42.665/ 1.650/ 13.122,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /8 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.58 s (8 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.07 s, min 0.07 s, max 0.08 s, tot 0.58 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 4.840e+03, min 7.743e+02, max 1.239e+04 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.372e-02, min 3.002e-03, max 8.637e-02 (8 samples) -#pr: best tun. rsb operation time was: on avg. 3.099e-08s, min 3.099e-08s, max 3.099e-08s, tot 2.480e-07s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.422e-03s, min 4.446e-03s, max 7.998e-03s, tot 5.938e-02s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.845e+00 1.233e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.575e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.04 s, tot 0.11 s (8 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.04 s, tot 0.11 s (8 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.812e+03, min 4.499e+02, max 7.198e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.901e-01, min 5.312e-03, max 6.010e-01 (8 samples) +#pr: best tun. rsb operation time was: on avg. 5.335e-08s, min 5.335e-08s, max 5.335e-08s, tot 4.268e-07s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.262e-03s, min 4.320e-04s, max 4.518e-03s, tot 1.009e-02s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.821e+00 3.222e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.040e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) -#pr: Record collection took 4.04 s. +#pr: Record collection took 0.74 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 100 environment variables in 5413 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 100 environment variables in 5467 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1788680920_gcc-14.2.rpr -# Removing the temporary record file rsbench_pr__1788680920_gcc-14.2.rpr.tmp. -# terminating run at 1788680930 (after 9.3s of w.c.t.) -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash ./scripts/doc-tests.sh +#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1754271497_gcc-14.2.rpr +# Removing the temporary record file rsbench_pr__1754271497_gcc-14.2.rpr.tmp. +# terminating run at 1754271504 (after 6.2s of w.c.t.) +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh ./scripts/doc-tests.sh + set -o pipefail + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x -+ grep '^.\{71,\}' + cat /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/autotune.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/io-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/power.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/snippets.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/transpose.c ++ grep '^.\{71,\}' + true -+ grep '^[^ ].\{80,\}' + cat /build/reproducible-path/librsb-1.3.0.2+dfsg/README ++ grep '^[^ ].\{80,\}' + true -++ wc -l ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -h +++ wc -l + test 63 -ge 61 ++ wc -c ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -h + test 2014 -ge 1966 -++ wc -l ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h +++ wc -l + test 182 -ge 157 ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h ++ wc -c @@ -5144,7 +5180,7 @@ type char codes:D S C Z gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' if test /build/reproducible-path/librsb-1.3.0.2+dfsg != /build/reproducible-path/librsb-1.3.0.2+dfsg ; then cp /build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/vf.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/examples ; fi -( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) +( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) + which rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench + BRF=test.rpr @@ -5154,15 +5190,15 @@ Will invoke autotuning for ~10.000000 s x 1 rounds, specifying verbosity=0 and threads=0. (>0 means no structure tuning; 0 means only structure tuning, <0 means tuning of both with (negated) thread count suggestion). # Requested no transposition. # performance record file set to: test.rpr -# beginning run at 1788680931 +# beginning run at 1754271504 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench --lower 100 --as-symmetric --types : -n 1 --notranspose --compare-competitors --verbose --verbose --write-performance-record=test.rpr # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -# average timer granularity: 3.04e-08 s +# average timer granularity: 3.42e-08 s # Will write a final performance record to file test.rpr and periodic checkpoints to test.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -5201,7 +5237,7 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 2 (each --verbose occurrence counts +1) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 43690 bytes @@ -5221,29 +5257,29 @@ # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 4.944s +# Memory benchmark took 5.351s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 4 samples (1120 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 4.946s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.353s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.029e-02 s (100.00 %) - analyzed arrays in 2.080e-02 s (34.51 %) - cleaned-up arrays in 1.001e-05 s (0.02 %) - deduplicated arrays in 7.868e-06 s (0.01 %) + converted COO to RSB in 1.399e-02 s (100.00 %) + analyzed arrays in 4.124e-03 s (29.47 %) + cleaned-up arrays in 1.121e-05 s (0.08 %) + deduplicated arrays in 1.097e-05 s (0.08 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.399e-02 s (39.79 %) - memory allocations took 2.003e-05 s (0.03 %) - leafs setup took 2.003e-05 s (0.03 %) - halfword conversion took 1.543e-02 s (25.60 %) -Built (100 x 100)[0xaaaafddfe380]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.060s): (100 x 100)[0xaaaafddfe380]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 6.463e-03 s (46.19 %) + memory allocations took 1.979e-05 s (0.14 %) + leafs setup took 5.960e-06 s (0.04 %) + halfword conversion took 3.340e-03 s (23.87 %) +Built (100 x 100)[0xaaaae53733c0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.014s): (100 x 100)[0xaaaae53733c0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -5294,10 +5330,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.01575s; avg 0.00525s ( +/- 60.03/ 47.17 %); best 0.002099s; worst 0.007727s; std dev. 0.002347 (taking best). -Reference operation time is 0.0020988 s (9.625 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.002099 Mflops: 9.625) -Merge (3 -> 1 leaves) took w.c.t. of 9.799e-05s, ~7.796e-05s of computing time (of which 3.099e-05s sorting, 6.914e-06s analysis) +3 iterations (1 th.) took 0.003876s; avg 0.001292s ( +/- 16.48/ 8.43 %); best 0.001079s; worst 0.001401s; std dev. 0.0001506 (taking best). +Reference operation time is 0.00107908 s (18.72 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.001079 Mflops: 18.720) +Merge (3 -> 1 leaves) took w.c.t. of 7.2e-05s, ~6.008e-05s of computing time (of which 2.408e-05s sorting, 4.053e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5328,8 +5364,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 5.507e-05s; avg 1.836e-05s ( +/- 12.99/ 19.48 %); best 1.597e-05s; worst 2.193e-05s; std dev. 2.575e-06 (taking best). -Reference operation time is 1.5974e-05 s (1265 Mflops) with 1 threads. +3 iterations (1 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 14.62/ 17.69 %); best 8.821e-06s; worst 1.216e-05s; std dev. 1.381e-06 (taking best). +Reference operation time is 8.82149e-06 s (2290 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5345,16 +5381,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 1.597e-05 s ~Mflops: 1264.551 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 131.388x: 0.002099s -> 1.597e-05s, so taking this instance. +After merge step 1: tpop: 8.821e-06 s ~Mflops: 2289.863 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 122.324x: 0.001079s -> 8.821e-06s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.03314s (of which 0.000104s partitioning, 0.02441s I/O); computing times: 7.796e-05s in par. loops, 3.099e-05s sorting, 6.914e-06s analyzing) -Total merge + benchmarking process took 0.03314s, equivalent to 2074.6/15.8 new/old ops (0.01424s for 2 clones -- as 891.4/6.8 ops, or 445.7/3.4 ops per clone), SPEEDUP of 131.388x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 131.388x (0.002099s -> 1.597e-05s), will amortize in 15.9 ops by saving 0.002083s per op. -In 1 tuning rounds (tot. 0.055s, 0.014s for constructor, 2 clones) obtained a SPEEDUP of 13038.8% (131.4x) (from 9.625 to 1265 Mflops). Employed 0.032s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02085s (of which 7.606e-05s partitioning, 0.01502s I/O); computing times: 6.008e-05s in par. loops, 2.408e-05s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.02085s, equivalent to 2363.8/19.3 new/old ops (0.009042s for 2 clones -- as 1025.0/8.4 ops, or 512.5/4.2 ops per clone), SPEEDUP of 122.324x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 122.324x (0.001079s -> 8.821e-06s), will amortize in 19.5 ops by saving 0.00107s per op. +In 1 tuning rounds (tot. 0.028s, 0.009s for constructor, 2 clones) obtained a SPEEDUP of 12132.4% (122.3x) (from 18.72 to 2290 Mflops). Employed 0.016s for I/O of matrix plots. #pr: updating sample at index 1 (0^th of 4), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.086971 s (2.099e-03 s -> 1.597e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.044189 s (1.079e-03 s -> 8.821e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -5420,20 +5456,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 5.913e-05s; avg 1.971e-05s ( +/- 17.74/ 31.85 %); best 1.621e-05s; worst 2.599e-05s; std dev. 4.449e-06 (taking best). -Reference operation time is 1.62125e-05 s (1246 Mflops) with 1 threads. +3 iterations (1 th.) took 4.721e-05s; avg 1.574e-05s ( +/- 16.67/ 27.27 %); best 1.311e-05s; worst 2.003e-05s; std dev. 3.059e-06 (taking best). +Reference operation time is 1.3113e-05 s (1540 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.671e-03 s (100.00 %) - analyzed arrays in 1.559e-03 s (33.38 %) - cleaned-up arrays in 2.599e-05 s (0.56 %) - deduplicated arrays in 2.098e-05 s (0.45 %) + converted COO to RSB in 4.321e-03 s (100.00 %) + analyzed arrays in 1.670e-03 s (38.65 %) + cleaned-up arrays in 2.003e-05 s (0.46 %) + deduplicated arrays in 1.693e-05 s (0.39 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.051e-03 s (65.32 %) - memory allocations took 6.914e-06 s (0.15 %) + shuffled partitions in 2.600e-03 s (60.17 %) + memory allocations took 5.007e-06 s (0.12 %) leafs setup took 1.907e-06 s (0.04 %) - halfword conversion took 5.007e-06 s (0.11 %) -Built (100 x 100)[0xaaaafde08b50]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + halfword conversion took 7.153e-06 s (0.17 %) +Built (100 x 100)[0xaaaae537db90]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5467,16 +5503,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.132e-02 s (100.00 %) - analyzed arrays in 3.855e-03 s (34.07 %) - cleaned-up arrays in 1.287e-05 s (0.11 %) - deduplicated arrays in 1.192e-05 s (0.11 %) + converted COO to RSB in 6.978e-03 s (100.00 %) + analyzed arrays in 2.352e-03 s (33.71 %) + cleaned-up arrays in 1.907e-05 s (0.27 %) + deduplicated arrays in 1.597e-05 s (0.23 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.260e-03 s (37.65 %) - memory allocations took 4.292e-06 s (0.04 %) - leafs setup took 9.537e-07 s (0.01 %) - halfword conversion took 3.171e-03 s (28.02 %) -Built (100 x 100)[0xaaaafddfe6d0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + shuffled partitions in 2.495e-03 s (35.76 %) + memory allocations took 1.907e-06 s (0.03 %) + leafs setup took 3.099e-06 s (0.04 %) + halfword conversion took 2.091e-03 s (29.96 %) +Built (100 x 100)[0xaaaae5373710]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5522,9 +5558,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.006607s; avg 0.002202s ( +/- 5.88/ 7.03 %); best 0.002073s; worst 0.002357s; std dev. 0.0001174 (taking best). -Reference operation time is 0.00207281 s (9.745 Mflops) with 1 threads. -Challenging best inner round reference (1.62125e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.00207281 s/0 threads (speedup 0.00782149 x), same?n. +3 iterations (1 th.) took 0.002765s; avg 0.0009216s ( +/- 14.27/ 25.10 %); best 0.0007901s; worst 0.001153s; std dev. 0.0001641 (taking best). +Reference operation time is 0.000790119 s (25.57 Mflops) with 1 threads. +Challenging best inner round reference (1.3113e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000790119 s/0 threads (speedup 0.0165963 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5558,16 +5594,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.094e-02 s (100.00 %) - analyzed arrays in 4.488e-03 s (41.02 %) - cleaned-up arrays in 1.216e-05 s (0.11 %) - deduplicated arrays in 1.097e-05 s (0.10 %) + converted COO to RSB in 5.577e-03 s (100.00 %) + analyzed arrays in 1.830e-03 s (32.81 %) + cleaned-up arrays in 1.192e-05 s (0.21 %) + deduplicated arrays in 1.287e-05 s (0.23 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.918e-03 s (35.81 %) - memory allocations took 1.907e-06 s (0.02 %) - leafs setup took 3.099e-06 s (0.03 %) - halfword conversion took 2.506e-03 s (22.90 %) -Built (100 x 100)[0xaaaafddff0c0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.802e-03 s (32.31 %) + memory allocations took 4.292e-06 s (0.08 %) + leafs setup took 1.907e-06 s (0.03 %) + halfword conversion took 1.912e-03 s (34.29 %) +Built (100 x 100)[0xaaaae5374100]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5613,9 +5649,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003398s; avg 0.001133s ( +/- 15.25/ 29.08 %); best 0.0009599s; worst 0.001462s; std dev. 0.000233 (taking best). -Reference operation time is 0.000959873 s (21.04 Mflops) with 1 threads. -Challenging best inner round reference (1.62125e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000959873 s/0 threads (speedup 0.0168902 x), same?n. +3 iterations (1 th.) took 0.01065s; avg 0.00355s ( +/- 61.41/ 97.60 %); best 0.00137s; worst 0.007014s; std dev. 0.002477 (taking best). +Reference operation time is 0.00136995 s (14.75 Mflops) with 1 threads. +Challenging best inner round reference (1.3113e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.00136995 s/0 threads (speedup 0.00957188 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5649,16 +5685,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 8.250e-03 s (100.00 %) - analyzed arrays in 3.403e-03 s (41.25 %) - cleaned-up arrays in 1.192e-05 s (0.14 %) - deduplicated arrays in 1.097e-05 s (0.13 %) + converted COO to RSB in 7.807e-03 s (100.00 %) + analyzed arrays in 3.207e-03 s (41.08 %) + cleaned-up arrays in 2.599e-05 s (0.33 %) + deduplicated arrays in 2.193e-05 s (0.28 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.360e-03 s (28.60 %) - memory allocations took 4.053e-06 s (0.05 %) - leafs setup took 2.146e-06 s (0.03 %) - halfword conversion took 2.458e-03 s (29.79 %) -Built (100 x 100)[0xaaaafde08c70]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' + shuffled partitions in 2.364e-03 s (30.28 %) + memory allocations took 8.106e-06 s (0.10 %) + leafs setup took 8.821e-06 s (0.11 %) + halfword conversion took 2.170e-03 s (27.80 %) +Built (100 x 100)[0xaaaae537dcb0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5704,9 +5740,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002948s; avg 0.0009826s ( +/- 7.48/ 13.97 %); best 0.0009091s; worst 0.00112s; std dev. 9.713e-05 (taking best). -Reference operation time is 0.00090909 s (22.22 Mflops) with 1 threads. -Challenging best inner round reference (1.62125e-05 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.00090909 s/0 threads (speedup 0.0178337 x), same?n. +3 iterations (1 th.) took 0.00349s; avg 0.001163s ( +/- 11.36/ 7.19 %); best 0.001031s; worst 0.001247s; std dev. 9.454e-05 (taking best). +Reference operation time is 0.00103116 s (19.59 Mflops) with 1 threads. +Challenging best inner round reference (1.3113e-05 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.00103116 s/0 threads (speedup 0.0127168 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 34 subms, 25 lsubms, 2.3168 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5740,16 +5776,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.177e-03 s (100.00 %) - analyzed arrays in 4.901e-03 s (53.40 %) - cleaned-up arrays in 1.884e-05 s (0.21 %) - deduplicated arrays in 1.717e-05 s (0.19 %) + converted COO to RSB in 6.618e-03 s (100.00 %) + analyzed arrays in 2.653e-03 s (40.09 %) + cleaned-up arrays in 2.098e-05 s (0.32 %) + deduplicated arrays in 1.812e-05 s (0.27 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.245e-03 s (24.47 %) - memory allocations took 5.007e-06 s (0.05 %) - leafs setup took 2.861e-06 s (0.03 %) - halfword conversion took 1.986e-03 s (21.64 %) -Built (100 x 100)[0xaaaafde2f8e0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.930e-03 s (29.16 %) + memory allocations took 4.768e-06 s (0.07 %) + leafs setup took 2.861e-06 s (0.04 %) + halfword conversion took 1.986e-03 s (30.01 %) +Built (100 x 100)[0xaaaae53a4920]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5795,9 +5831,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003694s; avg 0.001231s ( +/- 8.55/ 14.92 %); best 0.001126s; worst 0.001415s; std dev. 0.0001303 (taking best). -Reference operation time is 0.00112605 s (17.94 Mflops) with 1 threads. -Challenging best inner round reference (1.62125e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.00112605 s/0 threads (speedup 0.0143976 x), same?n. +3 iterations (1 th.) took 0.00448s; avg 0.001493s ( +/- 32.42/ 51.60 %); best 0.001009s; worst 0.002264s; std dev. 0.0005509 (taking best). +Reference operation time is 0.00100923 s (20.02 Mflops) with 1 threads. +Challenging best inner round reference (1.3113e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.00100923 s/0 threads (speedup 0.0129931 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5831,16 +5867,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.914e-03 s (100.00 %) - analyzed arrays in 2.754e-03 s (39.83 %) - cleaned-up arrays in 1.216e-05 s (0.18 %) - deduplicated arrays in 9.775e-06 s (0.14 %) + converted COO to RSB in 5.837e-03 s (100.00 %) + analyzed arrays in 2.207e-03 s (37.81 %) + cleaned-up arrays in 1.597e-05 s (0.27 %) + deduplicated arrays in 1.502e-05 s (0.26 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.655e-03 s (23.94 %) - memory allocations took 5.007e-06 s (0.07 %) - leafs setup took 2.861e-06 s (0.04 %) - halfword conversion took 2.474e-03 s (35.78 %) -Built (100 x 100)[0xaaaafde2f8e0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.712e-03 s (29.33 %) + memory allocations took 5.960e-06 s (0.10 %) + leafs setup took 3.099e-06 s (0.05 %) + halfword conversion took 1.877e-03 s (32.15 %) +Built (100 x 100)[0xaaaae53a4920]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5886,11 +5922,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.004015s; avg 0.001338s ( +/- 39.93/ 40.84 %); best 0.0008039s; worst 0.001885s; std dev. 0.0004414 (taking best). -Reference operation time is 0.000803947 s (25.13 Mflops) with 1 threads. -Challenging best inner round reference (1.62125e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000803947 s/0 threads (speedup 0.0201661 x), same?n. +3 iterations (1 th.) took 0.003912s; avg 0.001304s ( +/- 6.66/ 7.36 %); best 0.001217s; worst 0.0014s; std dev. 7.493e-05 (taking best). +Reference operation time is 0.00121713 s (16.6 Mflops) with 1 threads. +Challenging best inner round reference (1.3113e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.00121713 s/0 threads (speedup 0.0107738 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 1245.96 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 1540.45 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5906,23 +5942,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0743029 s (eq. to 5e+03/ 5e+03 old/new op.times), gained local/global speedup 1 x (1.62125e-05 : 1.62125e-05) / 1 x (1.62125e-05 : 1.62125e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.0659521 s (eq. to 5e+03/ 5e+03 old/new op.times), gained local/global speedup 1 x (1.3113e-05 : 1.3113e-05) / 1 x (1.3113e-05 : 1.3113e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.074s, 0.053s for constructor, 0 clones) obtained NO speedup (best stays 1246 Mflops). -Second run of RSB Autotuner took 0.074337 s and estimated a speedup of 1.000000 x (1.621e-05 s -> 1.621e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.066s, 0.04s for constructor, 0 clones) obtained NO speedup (best stays 1540 Mflops). +Second run of RSB Autotuner took 0.0659869 s and estimated a speedup of 1.000000 x (1.311e-05 s -> 1.311e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:100 #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.020803 0.023991 0.044794 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.044794 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.020803 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.023991 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.004124 0.006463 0.010587 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.010587 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004124 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.006463 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.044794 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.010587 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -5937,34 +5973,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.060287 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.0139918 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.0208032 0 0.0239911 -# so far, program took 5.176s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.161s/0.000s . +%constructor:lower-100x100-5050nz 0 0.00412393 0 0.00646305 +# so far, program took 5.484s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.110s/0.000s . getrusage() stats: -ru_maxrss: 8 (maximum resident set size -- MB) -ru_stime : 0.06198s (system CPU time used) -ru_utime : 4.468s (user CPU time used) +ru_maxrss: 6 (maximum resident set size -- MB) +ru_stime : 0.04007s (system CPU time used) +ru_utime : 5.977s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.176s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.161s/0.000s . +# so far, program took 5.484s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.110s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.023e-02 s (100.00 %) - analyzed arrays in 1.565e-03 s (15.30 %) - cleaned-up arrays in 1.097e-05 s (0.11 %) - deduplicated arrays in 9.060e-06 s (0.09 %) + converted COO to RSB in 6.867e-03 s (100.00 %) + analyzed arrays in 1.243e-03 s (18.10 %) + cleaned-up arrays in 1.717e-05 s (0.25 %) + deduplicated arrays in 1.502e-05 s (0.22 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 6.686e-03 s (65.34 %) - memory allocations took 1.907e-06 s (0.02 %) - leafs setup took 3.815e-06 s (0.04 %) - halfword conversion took 1.955e-03 s (19.11 %) -Built (100 x 100)[0xaaaafde08c70]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.010s): (100 x 100)[0xaaaafde08c70]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 4.166e-03 s (60.67 %) + memory allocations took 4.768e-06 s (0.07 %) + leafs setup took 4.053e-06 s (0.06 %) + halfword conversion took 1.416e-03 s (20.62 %) +Built (100 x 100)[0xaaaae537dcb0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.007s): (100 x 100)[0xaaaae537dcb0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -6015,10 +6051,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002802s; avg 0.000934s ( +/- 1.93/ 1.08 %); best 0.000916s; worst 0.0009441s; std dev. 1.279e-05 (taking best). -Reference operation time is 0.000916004 s (22.05 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.000916 Mflops: 22.052) -Merge (3 -> 1 leaves) took w.c.t. of 5.412e-05s, ~4.601e-05s of computing time (of which 1.907e-05s sorting, 2.146e-06s analysis) +3 iterations (1 th.) took 0.002537s; avg 0.0008457s ( +/- 8.37/ 10.83 %); best 0.0007749s; worst 0.0009372s; std dev. 6.789e-05 (taking best). +Reference operation time is 0.00077486 s (26.07 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0007749 Mflops: 26.069) +Merge (3 -> 1 leaves) took w.c.t. of 5.698e-05s, ~4.888e-05s of computing time (of which 2.003e-05s sorting, 2.861e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6049,7 +6085,7 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.004e-05s; avg 1.001e-05s ( +/- 0.00/ 0.00 %); best 1.001e-05s; worst 1.001e-05s; std dev. 0 (taking best). +3 iterations (1 th.) took 3.219e-05s; avg 1.073e-05s ( +/- 6.67/ 13.33 %); best 1.001e-05s; worst 1.216e-05s; std dev. 1.012e-06 (taking best). Reference operation time is 1.00136e-05 s (2017 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6067,15 +6103,15 @@ # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success After merge step 1: tpop: 1.001e-05 s ~Mflops: 2017.260 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 91.476x: 0.000916s -> 1.001e-05s, so taking this instance. +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 77.381x: 0.0007749s -> 1.001e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.0176s (of which 5.603e-05s partitioning, 0.01336s I/O); computing times: 4.601e-05s in par. loops, 1.907e-05s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.0176s, equivalent to 1757.3/19.2 new/old ops (0.006865s for 2 clones -- as 685.6/7.5 ops, or 342.8/3.7 ops per clone), SPEEDUP of 91.476x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 91.476x (0.000916s -> 1.001e-05s), will amortize in 19.4 ops by saving 0.000906s per op. -In 1 tuning rounds (tot. 0.023s, 0.0069s for constructor, 2 clones) obtained a SPEEDUP of 9047.6% (91.48x) (from 22.05 to 2017 Mflops). Employed 0.009s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01112s (of which 6.008e-05s partitioning, 0.007538s I/O); computing times: 4.888e-05s in par. loops, 2.003e-05s sorting, 2.861e-06s analyzing) +Total merge + benchmarking process took 0.01112s, equivalent to 1110.4/14.3 new/old ops (0.006156s for 2 clones -- as 614.8/7.9 ops, or 307.4/4.0 ops per clone), SPEEDUP of 77.381x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 77.381x (0.0007749s -> 1.001e-05s), will amortize in 14.5 ops by saving 0.0007648s per op. +In 1 tuning rounds (tot. 0.017s, 0.0062s for constructor, 2 clones) obtained a SPEEDUP of 7638.1% (77.38x) (from 26.07 to 2017 Mflops). Employed 0.011s for I/O of matrix plots. #pr: updating sample at index 2 (1^th of 4), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.0324581 s (9.160e-04 s -> 1.001e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0271039 s (7.749e-04 s -> 1.001e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6141,20 +6177,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 21.54/ 36.15 %); best 8.106e-06s; worst 1.407e-05s; std dev. 2.657e-06 (taking best). -Reference operation time is 8.10623e-06 s (2492 Mflops) with 1 threads. +3 iterations (1 th.) took 3.695e-05s; avg 1.232e-05s ( +/- 26.45/ 45.16 %); best 9.06e-06s; worst 1.788e-05s; std dev. 3.953e-06 (taking best). +Reference operation time is 9.05991e-06 s (2230 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.208e-03 s (100.00 %) - analyzed arrays in 1.060e-03 s (33.04 %) - cleaned-up arrays in 1.216e-05 s (0.38 %) - deduplicated arrays in 1.097e-05 s (0.34 %) + converted COO to RSB in 2.450e-03 s (100.00 %) + analyzed arrays in 8.440e-04 s (34.45 %) + cleaned-up arrays in 1.478e-05 s (0.60 %) + deduplicated arrays in 1.407e-05 s (0.57 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.118e-03 s (66.02 %) - memory allocations took 3.815e-06 s (0.12 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 2.146e-06 s (0.07 %) -Built (100 x 100)[0xaaaafde08b50]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 1.564e-03 s (63.84 %) + memory allocations took 6.199e-06 s (0.25 %) + leafs setup took 2.146e-06 s (0.09 %) + halfword conversion took 3.815e-06 s (0.16 %) +Built (100 x 100)[0xaaaae537db90]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6188,16 +6224,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.277e-03 s (100.00 %) - analyzed arrays in 1.279e-03 s (56.17 %) - cleaned-up arrays in 1.192e-05 s (0.52 %) - deduplicated arrays in 1.001e-05 s (0.44 %) + converted COO to RSB in 4.561e-03 s (100.00 %) + analyzed arrays in 1.040e-03 s (22.80 %) + cleaned-up arrays in 1.383e-05 s (0.30 %) + deduplicated arrays in 1.216e-05 s (0.27 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.711e-04 s (42.65 %) - memory allocations took 9.537e-07 s (0.04 %) - leafs setup took 9.537e-07 s (0.04 %) - halfword conversion took 1.907e-06 s (0.08 %) -Built (100 x 100)[0xaaaafddff0c0]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 3.481e-03 s (76.33 %) + memory allocations took 4.053e-06 s (0.09 %) + leafs setup took 3.815e-06 s (0.08 %) + halfword conversion took 5.007e-06 s (0.11 %) +Built (100 x 100)[0xaaaae5374100]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6243,9 +6279,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 2.789e-05s; avg 9.298e-06s ( +/- 25.64/ 38.46 %); best 6.914e-06s; worst 1.287e-05s; std dev. 2.575e-06 (taking best). -Reference operation time is 6.91414e-06 s (2922 Mflops) with 1 threads. -Challenging best inner round reference (8.10623e-06 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 6.91414e-06 s/0 threads (speedup 1.17241 x), same?n. +3 iterations (1 th.) took 3.195e-05s; avg 1.065e-05s ( +/- 26.12/ 41.04 %); best 7.868e-06s; worst 1.502e-05s; std dev. 3.129e-06 (taking best). +Reference operation time is 7.86781e-06 s (2567 Mflops) with 1 threads. +Challenging best inner round reference (9.05991e-06 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 7.86781e-06 s/0 threads (speedup 1.15152 x), same?n. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6278,16 +6314,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.360e-03 s (100.00 %) - analyzed arrays in 2.074e-03 s (32.61 %) - cleaned-up arrays in 1.097e-05 s (0.17 %) - deduplicated arrays in 1.001e-05 s (0.16 %) + converted COO to RSB in 5.013e-03 s (100.00 %) + analyzed arrays in 1.689e-03 s (33.70 %) + cleaned-up arrays in 1.311e-05 s (0.26 %) + deduplicated arrays in 1.192e-05 s (0.24 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.975e-03 s (31.05 %) - memory allocations took 5.007e-06 s (0.08 %) - leafs setup took 1.907e-06 s (0.03 %) - halfword conversion took 2.283e-03 s (35.90 %) -Built (100 x 100)[0xaaaafde08c70]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 8, symflags:'LS' + shuffled partitions in 1.776e-03 s (35.43 %) + memory allocations took 2.861e-06 s (0.06 %) + leafs setup took 9.537e-07 s (0.02 %) + halfword conversion took 1.518e-03 s (30.28 %) +Built (100 x 100)[0xaaaae537dcb0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 8, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6333,9 +6369,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003805s; avg 0.001268s ( +/- 28.96/ 39.31 %); best 0.000901s; worst 0.001767s; std dev. 0.0003655 (taking best). -Reference operation time is 0.000900984 s (22.42 Mflops) with 1 threads. -Challenging best inner round reference (6.91414e-06 s/0 threads) with: subdivision 0.5, 8 leaves, 2.185 bytes/nz, 0.000900984 s/0 threads (speedup 0.00767399 x), same?n. +3 iterations (1 th.) took 0.002568s; avg 0.000856s ( +/- 8.75/ 15.28 %); best 0.0007811s; worst 0.0009868s; std dev. 9.283e-05 (taking best). +Reference operation time is 0.000781059 s (25.86 Mflops) with 1 threads. +Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 0.5, 8 leaves, 2.185 bytes/nz, 0.000781059 s/0 threads (speedup 0.0100733 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 11 subms, 8 lsubms, 2.1846 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6369,16 +6405,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.267e-03 s (100.00 %) - analyzed arrays in 5.647e-03 s (60.94 %) - cleaned-up arrays in 1.001e-05 s (0.11 %) - deduplicated arrays in 7.868e-06 s (0.08 %) + converted COO to RSB in 5.941e-03 s (100.00 %) + analyzed arrays in 2.970e-03 s (49.99 %) + cleaned-up arrays in 1.407e-05 s (0.24 %) + deduplicated arrays in 1.097e-05 s (0.18 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.916e-03 s (20.67 %) - memory allocations took 4.292e-06 s (0.05 %) - leafs setup took 1.192e-06 s (0.01 %) - halfword conversion took 1.680e-03 s (18.13 %) -Built (100 x 100)[0xaaaafde08c70]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 19, symflags:'LS' + shuffled partitions in 1.450e-03 s (24.40 %) + memory allocations took 3.099e-06 s (0.05 %) + leafs setup took 2.146e-06 s (0.04 %) + halfword conversion took 1.491e-03 s (25.09 %) +Built (100 x 100)[0xaaaae537dcb0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 19, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6424,9 +6460,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003033s; avg 0.001011s ( +/- 29.86/ 36.29 %); best 0.0007091s; worst 0.001378s; std dev. 0.0002769 (taking best). -Reference operation time is 0.000709057 s (28.49 Mflops) with 1 threads. -Challenging best inner round reference (6.91414e-06 s/0 threads) with: subdivision 1, 19 leaves, 2.272 bytes/nz, 0.000709057 s/0 threads (speedup 0.00975118 x), same?n. +3 iterations (1 th.) took 0.002129s; avg 0.0007096s ( +/- 4.48/ 2.58 %); best 0.0006778s; worst 0.0007279s; std dev. 2.256e-05 (taking best). +Reference operation time is 0.000677824 s (29.8 Mflops) with 1 threads. +Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 1, 19 leaves, 2.272 bytes/nz, 0.000677824 s/0 threads (speedup 0.0116075 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 26 subms, 19 lsubms, 2.2725 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6460,16 +6496,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.452e-03 s (100.00 %) - analyzed arrays in 2.062e-03 s (31.96 %) - cleaned-up arrays in 8.821e-06 s (0.14 %) - deduplicated arrays in 8.106e-06 s (0.13 %) + converted COO to RSB in 5.000e-03 s (100.00 %) + analyzed arrays in 1.439e-03 s (28.78 %) + cleaned-up arrays in 1.287e-05 s (0.26 %) + deduplicated arrays in 1.121e-05 s (0.22 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.934e-03 s (29.98 %) - memory allocations took 6.914e-06 s (0.11 %) - leafs setup took 1.907e-06 s (0.03 %) - halfword conversion took 2.430e-03 s (37.67 %) -Built (100 x 100)[0xaaaafde08c70]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.585e-03 s (31.70 %) + memory allocations took 5.245e-06 s (0.10 %) + leafs setup took 2.861e-06 s (0.06 %) + halfword conversion took 1.944e-03 s (38.88 %) +Built (100 x 100)[0xaaaae537dcb0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6515,9 +6551,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002516s; avg 0.0008386s ( +/- 17.12/ 8.75 %); best 0.000695s; worst 0.000912s; std dev. 0.0001016 (taking best). -Reference operation time is 0.00069499 s (29.07 Mflops) with 1 threads. -Challenging best inner round reference (6.91414e-06 s/0 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.00069499 s/0 threads (speedup 0.00994854 x), same?n. +3 iterations (1 th.) took 0.002467s; avg 0.0008223s ( +/- 9.77/ 16.00 %); best 0.000742s; worst 0.0009539s; std dev. 9.381e-05 (taking best). +Reference operation time is 0.000741959 s (27.23 Mflops) with 1 threads. +Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000741959 s/0 threads (speedup 0.0106041 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6551,16 +6587,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 7.724e-03 s (100.00 %) - analyzed arrays in 2.293e-03 s (29.69 %) - cleaned-up arrays in 1.097e-05 s (0.14 %) - deduplicated arrays in 9.060e-06 s (0.12 %) + converted COO to RSB in 6.169e-03 s (100.00 %) + analyzed arrays in 2.420e-03 s (39.23 %) + cleaned-up arrays in 1.407e-05 s (0.23 %) + deduplicated arrays in 1.287e-05 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.921e-03 s (37.82 %) - memory allocations took 3.815e-06 s (0.05 %) - leafs setup took 5.007e-06 s (0.06 %) - halfword conversion took 2.481e-03 s (32.12 %) -Built (100 x 100)[0xaaaafde2a9f0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 2.498e-03 s (40.49 %) + memory allocations took 5.007e-06 s (0.08 %) + leafs setup took 3.099e-06 s (0.05 %) + halfword conversion took 1.216e-03 s (19.71 %) +Built (100 x 100)[0xaaaae539fa30]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6606,11 +6642,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003418s; avg 0.001139s ( +/- 16.61/ 8.92 %); best 0.0009501s; worst 0.001241s; std dev. 0.0001339 (taking best). -Reference operation time is 0.000950098 s (21.26 Mflops) with 1 threads. -Challenging best inner round reference (6.91414e-06 s/0 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000950098 s/0 threads (speedup 0.00727729 x), same?n. +3 iterations (1 th.) took 0.002523s; avg 0.000841s ( +/- 23.43/ 22.47 %); best 0.000644s; worst 0.00103s; std dev. 0.0001577 (taking best). +Reference operation time is 0.000643969 s (31.37 Mflops) with 1 threads. +Challenging best inner round reference (7.86781e-06 s/0 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000643969 s/0 threads (speedup 0.0122177 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 0.25: 2921.55 Mflops. +Best sparse multiply performance with subdivision multiplier of 0.25: 2567.42 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6626,9 +6662,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0496349 s (eq. to 6e+03/ 7e+03 old/new op.times), gained local/global speedup 1.17241 x (8.10623e-06 : 6.91414e-06) / 1.17241 x (8.10623e-06 : 6.91414e-06). This is amortizable in 41637 op.times. -In 1 tuning rounds (tot. 0.05s, 0.036s for constructor, 0 clones) obtained a SPEEDUP of 17.2% (1.172x) (from 2492 to 2922 Mflops). -Second run of RSB Autotuner took 0.0496621 s and estimated a speedup of 1.172414 x (8.106e-06 s -> 6.914e-06 s per op) in new matrix (1 -> 1 lsubm) +Last tuner inner round (1 of 1) took 0.04052 s (eq. to 4e+03/ 5e+03 old/new op.times), gained local/global speedup 1.15152 x (9.05991e-06 : 7.86781e-06) / 1.15152 x (9.05991e-06 : 7.86781e-06). This is amortizable in 33991 op.times. +In 1 tuning rounds (tot. 0.041s, 0.03s for constructor, 0 clones) obtained a SPEEDUP of 15.2% (1.152x) (from 2230 to 2567 Mflops). +Second run of RSB Autotuner took 0.0405579 s and estimated a speedup of 1.151515 x (9.060e-06 s -> 7.868e-06 s per op) in new matrix (1 -> 1 lsubm) RSB Autotuner suggested a new matrix: freeing the old one. #min:1 #max:1 @@ -6636,13 +6672,13 @@ #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001565 0.006686 0.008251 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.008251 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001565 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.006686 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001243 0.004166 0.005409 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005409 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001243 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004166 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.008251 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005409 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -6657,34 +6693,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.0102329 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00686693 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00156522 0 0.00668597 -# so far, program took 5.275s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.243s/0.000s . +%constructor:lower-100x100-5050nz 0 0.00124311 0 0.00416589 +# so far, program took 5.563s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.178s/0.000s . getrusage() stats: -ru_maxrss: 8 (maximum resident set size -- MB) -ru_stime : 0.07013s (system CPU time used) -ru_utime : 4.869s (user CPU time used) +ru_maxrss: 6 (maximum resident set size -- MB) +ru_stime : 0.04376s (system CPU time used) +ru_utime : 6.418s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.275s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.243s/0.000s . +# so far, program took 5.563s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.178s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.253e-03 s (100.00 %) - analyzed arrays in 1.005e-03 s (16.07 %) - cleaned-up arrays in 1.192e-05 s (0.19 %) - deduplicated arrays in 1.121e-05 s (0.18 %) + converted COO to RSB in 9.831e-03 s (100.00 %) + analyzed arrays in 8.490e-04 s (8.64 %) + cleaned-up arrays in 1.502e-05 s (0.15 %) + deduplicated arrays in 1.216e-05 s (0.12 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.394e-03 s (54.28 %) - memory allocations took 3.815e-06 s (0.06 %) - leafs setup took 9.537e-07 s (0.02 %) - halfword conversion took 1.826e-03 s (29.20 %) -Built (100 x 100)[0xaaaafde08c70]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.006s): (100 x 100)[0xaaaafde08c70]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 6.493e-03 s (66.05 %) + memory allocations took 8.821e-06 s (0.09 %) + leafs setup took 2.861e-06 s (0.03 %) + halfword conversion took 2.448e-03 s (24.90 %) +Built (100 x 100)[0xaaaae537dcb0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.010s): (100 x 100)[0xaaaae537dcb0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -6735,10 +6771,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003939s; avg 0.001313s ( +/- 55.37/ 85.23 %); best 0.000586s; worst 0.002432s; std dev. 0.000803 (taking best). -Reference operation time is 0.000586033 s (137.9 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.000586 Mflops: 137.876) -Merge (3 -> 1 leaves) took w.c.t. of 4.101e-05s, ~3.29e-05s of computing time (of which 1.383e-05s sorting, 9.537e-07s analysis) +3 iterations (1 th.) took 0.001816s; avg 0.0006053s ( +/- 2.36/ 1.26 %); best 0.000591s; worst 0.000613s; std dev. 1.012e-05 (taking best). +Reference operation time is 0.00059104 s (136.7 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.000591 Mflops: 136.708) +Merge (3 -> 1 leaves) took w.c.t. of 4.506e-05s, ~3.791e-05s of computing time (of which 1.693e-05s sorting, 1.907e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6769,8 +6805,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 5.913e-05s; avg 1.971e-05s ( +/- 4.44/ 7.66 %); best 1.884e-05s; worst 2.122e-05s; std dev. 1.072e-06 (taking best). -Reference operation time is 1.88351e-05 s (4290 Mflops) with 1 threads. +3 iterations (1 th.) took 7.105e-05s; avg 2.368e-05s ( +/- 3.36/ 5.70 %); best 2.289e-05s; worst 2.503e-05s; std dev. 9.603e-07 (taking best). +Reference operation time is 2.28882e-05 s (3530 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6786,16 +6822,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 1.884e-05 s ~Mflops: 4289.870 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 31.114x: 0.000586s -> 1.884e-05s, so taking this instance. +After merge step 1: tpop: 2.289e-05 s ~Mflops: 3530.206 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 25.823x: 0.000591s -> 2.289e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.02634s (of which 4.292e-05s partitioning, 0.01503s I/O); computing times: 3.29e-05s in par. loops, 1.383e-05s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.02634s, equivalent to 1398.3/44.9 new/old ops (0.01635s for 2 clones -- as 868.0/27.9 ops, or 434.0/13.9 ops per clone), SPEEDUP of 31.114x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 31.114x (0.000586s -> 1.884e-05s), will amortize in 46.4 ops by saving 0.0005672s per op. -In 1 tuning rounds (tot. 0.036s, 0.016s for constructor, 2 clones) obtained a SPEEDUP of 3011.4% (31.11x) (from 137.9 to 4290 Mflops). Employed 0.009s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.008823s (of which 4.697e-05s partitioning, 0.006229s I/O); computing times: 3.791e-05s in par. loops, 1.693e-05s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.008823s, equivalent to 385.5/14.9 new/old ops (0.003677s for 2 clones -- as 160.7/6.2 ops, or 80.3/3.1 ops per clone), SPEEDUP of 25.823x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 25.823x (0.000591s -> 2.289e-05s), will amortize in 15.5 ops by saving 0.0005682s per op. +In 1 tuning rounds (tot. 0.012s, 0.0037s for constructor, 2 clones) obtained a SPEEDUP of 2482.3% (25.82x) (from 136.7 to 3530 Mflops). Employed 0.01s for I/O of matrix plots. #pr: updating sample at index 3 (2^th of 4), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.0445471 s (5.860e-04 s -> 1.884e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0222769 s (5.910e-04 s -> 2.289e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6861,20 +6897,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 6.795e-05s; avg 2.265e-05s ( +/- 7.37/ 14.74 %); best 2.098e-05s; worst 2.599e-05s; std dev. 2.36e-06 (taking best). -Reference operation time is 2.09808e-05 s (3851 Mflops) with 1 threads. +3 iterations (1 th.) took 8.583e-05s; avg 2.861e-05s ( +/- 20.00/ 40.00 %); best 2.289e-05s; worst 4.005e-05s; std dev. 8.092e-06 (taking best). +Reference operation time is 2.28882e-05 s (3530 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.374e-03 s (100.00 %) - analyzed arrays in 4.692e-03 s (73.61 %) - cleaned-up arrays in 1.001e-05 s (0.16 %) - deduplicated arrays in 8.106e-06 s (0.13 %) + converted COO to RSB in 1.907e-03 s (100.00 %) + analyzed arrays in 6.349e-04 s (33.29 %) + cleaned-up arrays in 1.097e-05 s (0.58 %) + deduplicated arrays in 9.060e-06 s (0.48 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.658e-03 s (26.01 %) - memory allocations took 3.099e-06 s (0.05 %) - leafs setup took 9.537e-07 s (0.01 %) - halfword conversion took 1.907e-06 s (0.03 %) -Built (100 x 100)[0xaaaafde08b50]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 1.242e-03 s (65.13 %) + memory allocations took 3.099e-06 s (0.16 %) + leafs setup took 2.861e-06 s (0.15 %) + halfword conversion took 3.099e-06 s (0.16 %) +Built (100 x 100)[0xaaaae537db90]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6908,16 +6944,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.560e-02 s (100.00 %) - analyzed arrays in 5.483e-03 s (35.14 %) - cleaned-up arrays in 1.001e-05 s (0.06 %) - deduplicated arrays in 8.821e-06 s (0.06 %) + converted COO to RSB in 5.627e-03 s (100.00 %) + analyzed arrays in 1.067e-03 s (18.96 %) + cleaned-up arrays in 1.001e-05 s (0.18 %) + deduplicated arrays in 8.821e-06 s (0.16 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 8.294e-03 s (53.16 %) - memory allocations took 1.907e-06 s (0.01 %) - leafs setup took 9.537e-07 s (0.01 %) - halfword conversion took 1.804e-03 s (11.56 %) -Built (100 x 100)[0xaaaafde08c70]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + shuffled partitions in 1.227e-03 s (21.81 %) + memory allocations took 1.907e-06 s (0.03 %) + leafs setup took 9.537e-07 s (0.02 %) + halfword conversion took 3.310e-03 s (58.82 %) +Built (100 x 100)[0xaaaae537dcb0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6963,9 +6999,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.004376s; avg 0.001459s ( +/- 30.42/ 43.84 %); best 0.001015s; worst 0.002098s; std dev. 0.0004633 (taking best). -Reference operation time is 0.00101495 s (79.61 Mflops) with 1 threads. -Challenging best inner round reference (2.09808e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.00101495 s/0 threads (speedup 0.0206718 x), same?n. +3 iterations (1 th.) took 0.001793s; avg 0.0005976s ( +/- 0.62/ 0.57 %); best 0.0005939s; worst 0.0006011s; std dev. 2.929e-06 (taking best). +Reference operation time is 0.000593901 s (136 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000593901 s/0 threads (speedup 0.0385387 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6999,16 +7035,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.815e-03 s (100.00 %) - analyzed arrays in 4.225e-03 s (43.05 %) - cleaned-up arrays in 1.097e-05 s (0.11 %) - deduplicated arrays in 9.060e-06 s (0.09 %) + converted COO to RSB in 4.934e-03 s (100.00 %) + analyzed arrays in 2.466e-03 s (49.98 %) + cleaned-up arrays in 1.001e-05 s (0.20 %) + deduplicated arrays in 1.001e-05 s (0.20 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.052e-03 s (31.10 %) - memory allocations took 4.053e-06 s (0.04 %) - leafs setup took 1.907e-06 s (0.02 %) - halfword conversion took 2.511e-03 s (25.58 %) -Built (100 x 100)[0xaaaafde08c70]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.205e-03 s (24.42 %) + memory allocations took 5.007e-06 s (0.10 %) + leafs setup took 1.907e-06 s (0.04 %) + halfword conversion took 1.236e-03 s (25.05 %) +Built (100 x 100)[0xaaaae537dcb0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7054,9 +7090,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.004874s; avg 0.001625s ( +/- 5.40/ 3.83 %); best 0.001537s; worst 0.001687s; std dev. 6.379e-05 (taking best). -Reference operation time is 0.00153708 s (52.57 Mflops) with 1 threads. -Challenging best inner round reference (2.09808e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.00153708 s/0 threads (speedup 0.0136498 x), same?n. +3 iterations (1 th.) took 0.002622s; avg 0.000874s ( +/- 29.05/ 17.84 %); best 0.0006201s; worst 0.00103s; std dev. 0.0001811 (taking best). +Reference operation time is 0.000620127 s (130.3 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000620127 s/0 threads (speedup 0.0369089 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7090,16 +7126,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.396e-03 s (100.00 %) - analyzed arrays in 3.815e-03 s (40.60 %) - cleaned-up arrays in 1.001e-05 s (0.11 %) - deduplicated arrays in 9.060e-06 s (0.10 %) + converted COO to RSB in 3.798e-03 s (100.00 %) + analyzed arrays in 1.256e-03 s (33.07 %) + cleaned-up arrays in 9.060e-06 s (0.24 %) + deduplicated arrays in 8.106e-06 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.118e-03 s (22.54 %) - memory allocations took 1.907e-06 s (0.02 %) - leafs setup took 1.907e-06 s (0.02 %) - halfword conversion took 3.440e-03 s (36.61 %) -Built (100 x 100)[0xaaaafde08c70]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' + shuffled partitions in 1.302e-03 s (34.28 %) + memory allocations took 4.768e-06 s (0.13 %) + leafs setup took 3.099e-06 s (0.08 %) + halfword conversion took 1.214e-03 s (31.96 %) +Built (100 x 100)[0xaaaae537dcb0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7145,9 +7181,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.003321s; avg 0.001107s ( +/- 19.33/ 18.15 %); best 0.0008931s; worst 0.001308s; std dev. 0.0001696 (taking best). -Reference operation time is 0.000893116 s (90.47 Mflops) with 1 threads. -Challenging best inner round reference (2.09808e-05 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.000893116 s/0 threads (speedup 0.0234917 x), same?n. +3 iterations (1 th.) took 0.001689s; avg 0.000563s ( +/- 3.74/ 6.04 %); best 0.0005419s; worst 0.000597s; std dev. 2.428e-05 (taking best). +Reference operation time is 0.000541925 s (149.1 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.000541925 s/0 threads (speedup 0.0422349 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 34 subms, 25 lsubms, 2.3168 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7181,16 +7217,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.522e-03 s (100.00 %) - analyzed arrays in 2.798e-03 s (42.90 %) - cleaned-up arrays in 9.060e-06 s (0.14 %) - deduplicated arrays in 7.868e-06 s (0.12 %) - sorted arrays in 9.537e-07 s (0.01 %) - shuffled partitions in 1.550e-03 s (23.77 %) - memory allocations took 9.537e-07 s (0.01 %) - leafs setup took 2.146e-06 s (0.03 %) - halfword conversion took 2.153e-03 s (33.01 %) -Built (100 x 100)[0xaaaafde2f8e0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + converted COO to RSB in 4.621e-03 s (100.00 %) + analyzed arrays in 1.422e-03 s (30.77 %) + cleaned-up arrays in 9.060e-06 s (0.20 %) + deduplicated arrays in 9.060e-06 s (0.20 %) + sorted arrays in 0.000e+00 s (0.00 %) + shuffled partitions in 1.220e-03 s (26.40 %) + memory allocations took 6.914e-06 s (0.15 %) + leafs setup took 3.099e-06 s (0.07 %) + halfword conversion took 1.951e-03 s (42.22 %) +Built (100 x 100)[0xaaaae53a4920]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7236,9 +7272,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002492s; avg 0.0008307s ( +/- 20.06/ 37.83 %); best 0.000664s; worst 0.001145s; std dev. 0.0002223 (taking best). -Reference operation time is 0.000663996 s (121.7 Mflops) with 1 threads. -Challenging best inner round reference (2.09808e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000663996 s/0 threads (speedup 0.0315978 x), same?n. +3 iterations (1 th.) took 0.003283s; avg 0.001094s ( +/- 39.96/ 49.59 %); best 0.0006571s; worst 0.001637s; std dev. 0.0004069 (taking best). +Reference operation time is 0.000657082 s (123 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000657082 s/0 threads (speedup 0.0348331 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7272,16 +7308,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 5.495e-03 s (100.00 %) - analyzed arrays in 1.995e-03 s (36.30 %) - cleaned-up arrays in 9.060e-06 s (0.16 %) - deduplicated arrays in 6.914e-06 s (0.13 %) + converted COO to RSB in 4.768e-03 s (100.00 %) + analyzed arrays in 1.646e-03 s (34.52 %) + cleaned-up arrays in 1.097e-05 s (0.23 %) + deduplicated arrays in 1.001e-05 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.795e-03 s (32.66 %) - memory allocations took 5.245e-06 s (0.10 %) - leafs setup took 4.053e-06 s (0.07 %) - halfword conversion took 1.680e-03 s (30.58 %) -Built (100 x 100)[0xaaaafde2f8e0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.249e-03 s (26.19 %) + memory allocations took 1.001e-05 s (0.21 %) + leafs setup took 3.099e-06 s (0.07 %) + halfword conversion took 1.836e-03 s (38.51 %) +Built (100 x 100)[0xaaaae53a4920]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7327,11 +7363,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002389s; avg 0.0007963s ( +/- 17.25/ 26.47 %); best 0.000659s; worst 0.001007s; std dev. 0.0001513 (taking best). -Reference operation time is 0.000658989 s (122.6 Mflops) with 1 threads. -Challenging best inner round reference (2.09808e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000658989 s/0 threads (speedup 0.0318379 x), same?n. +3 iterations (1 th.) took 0.002773s; avg 0.0009243s ( +/- 41.91/ 67.58 %); best 0.0005369s; worst 0.001549s; std dev. 0.0004459 (taking best). +Reference operation time is 0.000536919 s (150.5 Mflops) with 1 threads. +Challenging best inner round reference (2.28882e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000536919 s/0 threads (speedup 0.0426288 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 3851.13 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 3530.21 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7347,23 +7383,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0718832 s (eq. to 3e+03/ 3e+03 old/new op.times), gained local/global speedup 1 x (2.09808e-05 : 2.09808e-05) / 1 x (2.09808e-05 : 2.09808e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.039825 s (eq. to 2e+03/ 2e+03 old/new op.times), gained local/global speedup 1 x (2.28882e-05 : 2.28882e-05) / 1 x (2.28882e-05 : 2.28882e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.072s, 0.054s for constructor, 0 clones) obtained NO speedup (best stays 3851 Mflops). -Second run of RSB Autotuner took 0.0719049 s and estimated a speedup of 1.000000 x (2.098e-05 s -> 2.098e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.04s, 0.027s for constructor, 0 clones) obtained NO speedup (best stays 3530 Mflops). +Second run of RSB Autotuner took 0.03985 s and estimated a speedup of 1.000000 x (2.289e-05 s -> 2.289e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001005 0.003394 0.004399 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004399 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001005 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003394 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000849 0.006493 0.007342 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.007342 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000849 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.006493 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004399 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.007342 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -7378,34 +7414,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.006253 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00983095 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00100493 0 0.00339413 -# so far, program took 5.403s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.360s/0.000s . +%constructor:lower-100x100-5050nz 0 0.000849009 0 0.00649309 +# so far, program took 5.638s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.240s/0.000s . getrusage() stats: -ru_maxrss: 8 (maximum resident set size -- MB) -ru_stime : 0.08276s (system CPU time used) -ru_utime : 5.279s (user CPU time used) +ru_maxrss: 6 (maximum resident set size -- MB) +ru_stime : 0.05605s (system CPU time used) +ru_utime : 6.787s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.403s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.360s/0.000s . +# so far, program took 5.638s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.240s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.630e-03 s (100.00 %) - analyzed arrays in 8.531e-04 s (12.87 %) - cleaned-up arrays in 1.311e-05 s (0.20 %) - deduplicated arrays in 1.001e-05 s (0.15 %) + converted COO to RSB in 4.996e-03 s (100.00 %) + analyzed arrays in 9.871e-04 s (19.76 %) + cleaned-up arrays in 1.001e-05 s (0.20 %) + deduplicated arrays in 7.868e-06 s (0.16 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.345e-03 s (50.45 %) - memory allocations took 4.768e-06 s (0.07 %) - leafs setup took 1.907e-06 s (0.03 %) - halfword conversion took 2.401e-03 s (36.22 %) -Built (100 x 100)[0xaaaafde08c70]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.007s): (100 x 100)[0xaaaafde08c70]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 2.628e-03 s (52.60 %) + memory allocations took 3.099e-06 s (0.06 %) + leafs setup took 1.001e-05 s (0.20 %) + halfword conversion took 1.348e-03 s (26.98 %) +Built (100 x 100)[0xaaaae537dcb0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.005s): (100 x 100)[0xaaaae537dcb0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -7456,10 +7492,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002551s; avg 0.0008504s ( +/- 4.64/ 6.21 %); best 0.0008109s; worst 0.0009031s; std dev. 3.882e-05 (taking best). -Reference operation time is 0.000810862 s (99.65 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0008109 Mflops: 99.647) -Merge (3 -> 1 leaves) took w.c.t. of 5.198e-05s, ~4.387e-05s of computing time (of which 2.289e-05s sorting, 1.907e-06s analysis) +3 iterations (1 th.) took 0.002293s; avg 0.0007644s ( +/- 7.61/ 6.74 %); best 0.0007062s; worst 0.0008159s; std dev. 4.502e-05 (taking best). +Reference operation time is 0.000706196 s (114.4 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0007062 Mflops: 114.416) +Merge (3 -> 1 leaves) took w.c.t. of 6.199e-05s, ~5.198e-05s of computing time (of which 2.408e-05s sorting, 3.099e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7490,8 +7526,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 6.986e-05s; avg 2.329e-05s ( +/- 1.71/ 2.39 %); best 2.289e-05s; worst 2.384e-05s; std dev. 4.052e-07 (taking best). -Reference operation time is 2.28882e-05 s (3530 Mflops) with 1 threads. +3 iterations (1 th.) took 9.894e-05s; avg 3.298e-05s ( +/- 3.13/ 2.65 %); best 3.195e-05s; worst 3.386e-05s; std dev. 7.867e-07 (taking best). +Reference operation time is 3.19481e-05 s (2529 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7507,16 +7543,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 2.289e-05 s ~Mflops: 3530.206 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 35.427x: 0.0008109s -> 2.289e-05s, so taking this instance. +After merge step 1: tpop: 3.195e-05 s ~Mflops: 2529.103 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 22.104x: 0.0007062s -> 3.195e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01213s (of which 5.388e-05s partitioning, 0.009535s I/O); computing times: 4.387e-05s in par. loops, 2.289e-05s sorting, 1.907e-06s analyzing) -Total merge + benchmarking process took 0.01213s, equivalent to 529.8/15.0 new/old ops (0.00468s for 2 clones -- as 204.5/5.8 ops, or 102.2/2.9 ops per clone), SPEEDUP of 35.427x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 35.427x (0.0008109s -> 2.289e-05s), will amortize in 15.4 ops by saving 0.000788s per op. -In 1 tuning rounds (tot. 0.017s, 0.0047s for constructor, 2 clones) obtained a SPEEDUP of 3442.7% (35.43x) (from 99.65 to 3530 Mflops). Employed 0.0075s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.008935s (of which 6.604e-05s partitioning, 0.006498s I/O); computing times: 5.198e-05s in par. loops, 2.408e-05s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.008935s, equivalent to 279.7/12.7 new/old ops (0.004066s for 2 clones -- as 127.3/5.8 ops, or 63.6/2.9 ops per clone), SPEEDUP of 22.104x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 22.104x (0.0007062s -> 3.195e-05s), will amortize in 13.3 ops by saving 0.0006742s per op. +In 1 tuning rounds (tot. 0.013s, 0.0041s for constructor, 2 clones) obtained a SPEEDUP of 2110.4% (22.1x) (from 114.4 to 2529 Mflops). Employed 0.0053s for I/O of matrix plots. #pr: updating sample at index 4 (3^th of 4), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.024636 s (8.109e-04 s -> 2.289e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.018955 s (7.062e-04 s -> 3.195e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -7582,20 +7618,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 6.294e-05s; avg 2.098e-05s ( +/- 10.23/ 14.77 %); best 1.884e-05s; worst 2.408e-05s; std dev. 2.245e-06 (taking best). +3 iterations (1 th.) took 6.58e-05s; avg 2.193e-05s ( +/- 14.13/ 27.17 %); best 1.884e-05s; worst 2.789e-05s; std dev. 4.216e-06 (taking best). Reference operation time is 1.88351e-05 s (4290 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 7.549e-03 s (100.00 %) - analyzed arrays in 5.307e-03 s (70.30 %) - cleaned-up arrays in 9.060e-06 s (0.12 %) - deduplicated arrays in 7.868e-06 s (0.10 %) + converted COO to RSB in 2.334e-03 s (100.00 %) + analyzed arrays in 8.922e-04 s (38.23 %) + cleaned-up arrays in 1.001e-05 s (0.43 %) + deduplicated arrays in 6.914e-06 s (0.30 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.221e-03 s (29.42 %) - memory allocations took 2.146e-06 s (0.03 %) - leafs setup took 1.192e-06 s (0.02 %) - halfword conversion took 9.537e-07 s (0.01 %) -Built (100 x 100)[0xaaaafde08b50]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 1.155e-03 s (49.48 %) + memory allocations took 2.649e-04 s (11.35 %) + leafs setup took 3.099e-06 s (0.13 %) + halfword conversion took 1.907e-06 s (0.08 %) +Built (100 x 100)[0xaaaae537db90]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7629,16 +7665,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 5.852e-03 s (100.00 %) - analyzed arrays in 2.382e-03 s (40.70 %) - cleaned-up arrays in 9.060e-06 s (0.15 %) - deduplicated arrays in 7.868e-06 s (0.13 %) + converted COO to RSB in 4.711e-03 s (100.00 %) + analyzed arrays in 1.634e-03 s (34.69 %) + cleaned-up arrays in 1.001e-05 s (0.21 %) + deduplicated arrays in 8.106e-06 s (0.17 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.855e-03 s (31.70 %) - memory allocations took 2.861e-06 s (0.05 %) - leafs setup took 2.861e-06 s (0.05 %) - halfword conversion took 1.592e-03 s (27.21 %) -Built (100 x 100)[0xaaaafde08c70]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' + shuffled partitions in 1.392e-03 s (29.55 %) + memory allocations took 5.722e-06 s (0.12 %) + leafs setup took 1.907e-06 s (0.04 %) + halfword conversion took 1.658e-03 s (35.19 %) +Built (100 x 100)[0xaaaae537dcb0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7684,9 +7720,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002579s; avg 0.0008597s ( +/- 27.64/ 19.92 %); best 0.000622s; worst 0.001031s; std dev. 0.0001734 (taking best). -Reference operation time is 0.000622034 s (129.9 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 0.000622034 s/0 threads (speedup 0.0302798 x), same?n. +3 iterations (1 th.) took 0.001969s; avg 0.0006563s ( +/- 16.95/ 25.99 %); best 0.000545s; worst 0.0008268s; std dev. 0.0001224 (taking best). +Reference operation time is 0.000545025 s (148.3 Mflops) with 1 threads. +Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 0.000545025 s/0 threads (speedup 0.0345582 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 8 subms, 6 lsubms, 2.1632 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7720,16 +7756,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 5.389e-03 s (100.00 %) - analyzed arrays in 2.196e-03 s (40.75 %) - cleaned-up arrays in 8.821e-06 s (0.16 %) - deduplicated arrays in 8.106e-06 s (0.15 %) + converted COO to RSB in 3.311e-03 s (100.00 %) + analyzed arrays in 1.396e-03 s (42.16 %) + cleaned-up arrays in 9.060e-06 s (0.27 %) + deduplicated arrays in 8.106e-06 s (0.24 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.728e-03 s (32.07 %) - memory allocations took 3.099e-06 s (0.06 %) - leafs setup took 2.861e-06 s (0.05 %) - halfword conversion took 1.441e-03 s (26.74 %) -Built (100 x 100)[0xaaaafde08c70]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' + shuffled partitions in 9.482e-04 s (28.64 %) + memory allocations took 2.861e-06 s (0.09 %) + leafs setup took 1.907e-06 s (0.06 %) + halfword conversion took 9.439e-04 s (28.51 %) +Built (100 x 100)[0xaaaae537dcb0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7775,9 +7811,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002423s; avg 0.0008077s ( +/- 17.05/ 14.77 %); best 0.00067s; worst 0.000927s; std dev. 0.0001057 (taking best). -Reference operation time is 0.000669956 s (120.6 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 0.5, 16 leaves, 2.25 bytes/nz, 0.000669956 s/0 threads (speedup 0.0281139 x), same?n. +3 iterations (1 th.) took 0.007825s; avg 0.002608s ( +/- 79.49/139.65 %); best 0.000535s; worst 0.006251s; std dev. 0.002584 (taking best). +Reference operation time is 0.000535011 s (151 Mflops) with 1 threads. +Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 0.5, 16 leaves, 2.25 bytes/nz, 0.000535011 s/0 threads (speedup 0.035205 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 22 subms, 16 lsubms, 2.2503 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7811,16 +7847,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.678e-03 s (100.00 %) - analyzed arrays in 3.084e-03 s (46.18 %) - cleaned-up arrays in 9.060e-06 s (0.14 %) - deduplicated arrays in 7.868e-06 s (0.12 %) + converted COO to RSB in 5.367e-03 s (100.00 %) + analyzed arrays in 1.699e-03 s (31.66 %) + cleaned-up arrays in 8.821e-06 s (0.16 %) + deduplicated arrays in 8.106e-06 s (0.15 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.906e-03 s (28.54 %) - memory allocations took 4.053e-06 s (0.06 %) - leafs setup took 3.099e-06 s (0.05 %) - halfword conversion took 1.664e-03 s (24.92 %) -Built (100 x 100)[0xaaaafde57030]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.396e-03 s (26.01 %) + memory allocations took 7.153e-06 s (0.13 %) + leafs setup took 5.007e-06 s (0.09 %) + halfword conversion took 2.242e-03 s (41.78 %) +Built (100 x 100)[0xaaaae53cc070]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7866,9 +7902,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002289s; avg 0.000763s ( +/- 17.82/ 35.27 %); best 0.000627s; worst 0.001032s; std dev. 0.0001903 (taking best). -Reference operation time is 0.000627041 s (128.9 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 1, 36 leaves, 2.383 bytes/nz, 0.000627041 s/0 threads (speedup 0.030038 x), same?n. +3 iterations (1 th.) took 0.001592s; avg 0.0005307s ( +/- 1.62/ 0.99 %); best 0.0005221s; worst 0.000536s; std dev. 6.119e-06 (taking best). +Reference operation time is 0.000522137 s (154.7 Mflops) with 1 threads. +Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 1, 36 leaves, 2.383 bytes/nz, 0.000522137 s/0 threads (speedup 0.0360731 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7902,16 +7938,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.705e-02 s (100.00 %) - analyzed arrays in 1.936e-03 s (11.36 %) - cleaned-up arrays in 9.060e-06 s (0.05 %) - deduplicated arrays in 7.868e-06 s (0.05 %) + converted COO to RSB in 3.022e-03 s (100.00 %) + analyzed arrays in 1.019e-03 s (33.72 %) + cleaned-up arrays in 1.097e-05 s (0.36 %) + deduplicated arrays in 9.060e-06 s (0.30 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.141e-02 s (66.92 %) - memory allocations took 4.053e-06 s (0.02 %) - leafs setup took 5.007e-06 s (0.03 %) - halfword conversion took 3.676e-03 s (21.56 %) -Built (100 x 100)[0xaaaafde57030]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.007e-03 s (33.33 %) + memory allocations took 5.007e-06 s (0.17 %) + leafs setup took 1.907e-06 s (0.06 %) + halfword conversion took 9.689e-04 s (32.06 %) +Built (100 x 100)[0xaaaae53cc070]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7957,9 +7993,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.004351s; avg 0.00145s ( +/- 54.15/ 82.52 %); best 0.0006649s; worst 0.002647s; std dev. 0.0008599 (taking best). -Reference operation time is 0.000664949 s (121.5 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000664949 s/0 threads (speedup 0.0283256 x), same?n. +3 iterations (1 th.) took 0.003043s; avg 0.001014s ( +/- 47.86/ 34.57 %); best 0.0005288s; worst 0.001365s; std dev. 0.0003544 (taking best). +Reference operation time is 0.000528812 s (152.8 Mflops) with 1 threads. +Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000528812 s/0 threads (speedup 0.0356177 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7993,16 +8029,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.118e-02 s (100.00 %) - analyzed arrays in 3.585e-03 s (32.07 %) - cleaned-up arrays in 9.060e-06 s (0.08 %) - deduplicated arrays in 7.868e-06 s (0.07 %) + converted COO to RSB in 5.445e-03 s (100.00 %) + analyzed arrays in 2.029e-03 s (37.27 %) + cleaned-up arrays in 9.775e-06 s (0.18 %) + deduplicated arrays in 9.060e-06 s (0.17 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.502e-03 s (22.38 %) - memory allocations took 6.199e-06 s (0.06 %) - leafs setup took 4.053e-06 s (0.04 %) - halfword conversion took 5.065e-03 s (45.30 %) -Built (100 x 100)[0xaaaafde57030]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.714e-03 s (31.48 %) + memory allocations took 3.099e-06 s (0.06 %) + leafs setup took 2.861e-06 s (0.05 %) + halfword conversion took 1.677e-03 s (30.80 %) +Built (100 x 100)[0xaaaae53cc070]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8048,9 +8084,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002725s; avg 0.0009084s ( +/- 3.91/ 4.49 %); best 0.0008729s; worst 0.0009491s; std dev. 3.137e-05 (taking best). -Reference operation time is 0.00087285 s (92.57 Mflops) with 1 threads. -Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.00087285 s/0 threads (speedup 0.0215788 x), same?n. +3 iterations (1 th.) took 0.002514s; avg 0.000838s ( +/- 23.64/ 24.35 %); best 0.0006399s; worst 0.001042s; std dev. 0.0001643 (taking best). +Reference operation time is 0.000639915 s (126.3 Mflops) with 1 threads. +Challenging best inner round reference (1.88351e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000639915 s/0 threads (speedup 0.0294337 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz Best sparse multiply performance with subdivision multiplier of 1: 4289.87 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing @@ -8068,23 +8104,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0699759 s (eq. to 4e+03/ 4e+03 old/new op.times), gained local/global speedup 1 x (1.88351e-05 : 1.88351e-05) / 1 x (1.88351e-05 : 1.88351e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.0428262 s (eq. to 2e+03/ 2e+03 old/new op.times), gained local/global speedup 1 x (1.88351e-05 : 1.88351e-05) / 1 x (1.88351e-05 : 1.88351e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.07s, 0.054s for constructor, 0 clones) obtained NO speedup (best stays 4290 Mflops). -Second run of RSB Autotuner took 0.0699971 s and estimated a speedup of 1.000000 x (1.884e-05 s -> 1.884e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.043s, 0.025s for constructor, 0 clones) obtained NO speedup (best stays 4290 Mflops). +Second run of RSB Autotuner took 0.0428581 s and estimated a speedup of 1.000000 x (1.884e-05 s -> 1.884e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000853 0.003345 0.004198 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004198 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000853 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003345 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000987 0.002628 0.003615 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003615 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000987 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002628 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004198 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003615 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -8099,68 +8135,68 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00662994 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00499606 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.000853062 0 0.00334501 -# so far, program took 5.516s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.455s/0.000s . +%constructor:lower-100x100-5050nz 0 0.000987053 0 0.00262809 +# so far, program took 5.708s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.302s/0.000s . getrusage() stats: -ru_maxrss: 8 (maximum resident set size -- MB) -ru_stime : 0.09537s (system CPU time used) -ru_utime : 5.653s (user CPU time used) +ru_maxrss: 6 (maximum resident set size -- MB) +ru_stime : 0.0678s (system CPU time used) +ru_utime : 7.136s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 4) ordered by (1,1,1,1,1,4,1) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 1264.55 2.099e-03 0.000e+00 1.597e-05 0.000e+00 8.697e-02 3.34e+00 2.60e+00 1 2.02e-02 -pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 2017.26 9.160e-04 0.000e+00 1.001e-05 0.000e+00 3.246e-02 3.19e+00 1.56e+00 1 2.02e-02 -pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 4289.87 5.860e-04 0.000e+00 1.884e-05 0.000e+00 4.455e-02 2.83e+00 6.50e-01 1 8.08e-02 -pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 3530.21 8.109e-04 0.000e+00 2.289e-05 0.000e+00 2.464e-02 4.20e+00 1.17e+00 1 8.08e-02 +pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 2289.86 1.079e-03 0.000e+00 8.821e-06 0.000e+00 4.419e-02 6.04e+00 2.60e+00 1 2.02e-02 +pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 2017.26 7.749e-04 0.000e+00 1.001e-05 0.000e+00 2.710e-02 3.19e+00 1.56e+00 1 2.02e-02 +pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 3530.21 5.910e-04 0.000e+00 2.289e-05 0.000e+00 2.228e-02 2.33e+00 6.50e-01 1 8.08e-02 +pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 2529.10 7.062e-04 0.000e+00 3.195e-05 0.000e+00 1.895e-02 3.01e+00 1.17e+00 1 8.08e-02 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 7135.1 % faster, avg. sp. ratio 72.351x, max sp. ratio 131.388x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3031.9/1076.4/5444.5/12127.4 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 45.8/ 30.4/ 76.0/183.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 46.8, min. 31.3, max. 78.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 6090.8 % faster, avg. sp. ratio 61.908x, max sp. ratio 122.324x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2320.6/593.3/5009.2/9282.6 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 35.1/ 26.8/ 41.0/140.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 36.0, min. 28.1, max. 41.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 1683/ 1683/ 1683) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 5050/ 5050/ 5050) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 15150/ 6733/ 26933) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 45450/ 20200/ 80800) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 2.121/ 2.121/ 2.121) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.337/ 2.788/ 4.129,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 13.552/ 2.830/ 4.199,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.587/ 2.294/ 5.952,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 14.566/ 2.329/ 6.043,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.495/ 0.650/ 2.599) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 2.080/ 2.080/ 2.080) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.05 s, min 0.02 s, max 0.09 s, tot 0.19 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.05 s, min 0.02 s, max 0.09 s, tot 0.19 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.775e+03, min 1.265e+03, max 4.290e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 6.730e+01, min 9.625e+00, max 1.379e+02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 1.693e-05s, min 1.001e-05s, max 2.289e-05s, tot 6.771e-05s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 1.103e-03s, min 5.860e-04s, max 2.099e-03s, tot 4.412e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.156e+01 1.713e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 4.804e-01 -#pr: Record collection took 0.49 s. +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.02 s, max 0.04 s, tot 0.11 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.02 s, max 0.04 s, tot 0.11 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.592e+03, min 2.017e+03, max 3.530e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 7.398e+01, min 1.872e+01, max 1.367e+02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 1.842e-05s, min 8.821e-06s, max 3.195e-05s, tot 7.367e-05s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 7.878e-04s, min 5.910e-04s, max 1.079e-03s, tot 3.151e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.716e+00 2.002e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.038e+00 +#pr: Record collection took 0.31 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 99 environment variables in 5459 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 99 environment variables in 5513 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. #pr: ======== Saved a performance record of 4 samples to test.rpr # Removing the temporary record file test.rpr.tmp. -# terminating run at 1788680936 (after 5.5s of w.c.t.) +# terminating run at 1754271510 (after 5.7s of w.c.t.) + ls -ltr test-tuning-lower-100x100-5050nz--C-N-1--base.eps test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--D-N-1--base.eps test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--S-N-1--base.eps test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--Z-N-1--base.eps test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85638 Sep 5 19:48 test-tuning-lower-100x100-5050nz--D-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84559 Sep 5 19:48 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85639 Sep 5 19:48 test-tuning-lower-100x100-5050nz--S-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84560 Sep 5 19:48 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85639 Sep 5 19:48 test-tuning-lower-100x100-5050nz--C-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84559 Sep 5 19:48 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85638 Sep 5 19:48 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84560 Sep 5 19:48 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85642 Aug 4 15:38 test-tuning-lower-100x100-5050nz--D-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84564 Aug 4 15:38 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85643 Aug 4 15:38 test-tuning-lower-100x100-5050nz--S-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84566 Aug 4 15:38 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85644 Aug 4 15:38 test-tuning-lower-100x100-5050nz--C-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84566 Aug 4 15:38 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85644 Aug 4 15:38 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84566 Aug 4 15:38 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps + rsbench --read-performance-record test.rpr + ls -ltr test.txt --rw-r--r-- 1 pbuilder1 pbuilder1 4094 Sep 5 19:48 test.txt +-rw-r--r-- 1 pbuilder2 pbuilder2 4092 Aug 4 15:38 test.txt + RSB_PR_WLTC=2 + RSB_PR_SR=0 + rsbench --read-performance-record test.rpr @@ -8170,29 +8206,29 @@ /usr/bin/kpsepath ++ kpsepath tex ++ sed 's/!!//g;s/:/\n/g;' -+ find . /nonexistent/first-build/.texlive2025/texmf-config/tex/kpsewhich// /nonexistent/first-build/.texlive2025/texmf-var/tex/kpsewhich// /nonexistent/first-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/first-build/.texlive2025/texmf-config/tex/generic// /nonexistent/first-build/.texlive2025/texmf-var/tex/generic// /nonexistent/first-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/first-build/.texlive2025/texmf-config/tex/latex// /nonexistent/first-build/.texlive2025/texmf-var/tex/latex// /nonexistent/first-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/first-build/.texlive2025/texmf-config/tex/// /nonexistent/first-build/.texlive2025/texmf-var/tex/// /nonexistent/first-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls -find: '/nonexistent/first-build/.texlive2025/texmf-config/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-var/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/kpsewhich//': No such file or directory ++ find . /nonexistent/second-build/.texlive2025/texmf-config/tex/kpsewhich// /nonexistent/second-build/.texlive2025/texmf-var/tex/kpsewhich// /nonexistent/second-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/second-build/.texlive2025/texmf-config/tex/generic// /nonexistent/second-build/.texlive2025/texmf-var/tex/generic// /nonexistent/second-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/second-build/.texlive2025/texmf-config/tex/latex// /nonexistent/second-build/.texlive2025/texmf-var/tex/latex// /nonexistent/second-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/second-build/.texlive2025/texmf-config/tex/// /nonexistent/second-build/.texlive2025/texmf-var/tex/// /nonexistent/second-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls +find: '/nonexistent/second-build/.texlive2025/texmf-config/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-var/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/kpsewhich//': No such file or directory find: '/usr/local/share/texmf/tex/kpsewhich//': No such file or directory find: '/etc/texmf/tex/kpsewhich//': No such file or directory find: '/var/lib/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texlive/texmf-dist/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-config/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-var/tex/generic//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-config/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-var/tex/generic//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/generic//': No such file or directory find: '/usr/local/share/texmf/tex/generic//': No such file or directory find: '/usr/share/texmf/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-config/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-var/tex/latex//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-config/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-var/tex/latex//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/latex//': No such file or directory find: '/usr/local/share/texmf/tex/latex//': No such file or directory find: '/etc/texmf/tex/latex//': No such file or directory find: '/var/lib/texmf/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-config/tex///': No such file or directory -find: '/nonexistent/first-build/.texlive2025/texmf-var/tex///': No such file or directory -find: '/nonexistent/first-build/texmf/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-config/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2025/texmf-var/tex///': No such file or directory +find: '/nonexistent/second-build/texmf/tex///': No such file or directory find: '/usr/local/share/texmf/tex///': No such file or directory + exit 0 for mf in pd.mtx vf.mtx ; do if test -f /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; then true; else cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/$mf /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; fi; done @@ -8207,7 +8243,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0xaaaaf21be4a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0xaaaac96024a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -8222,7 +8258,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0xaaaae53b44a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0xaaaaf2da94a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -8286,51 +8322,51 @@ Done. Building a matrix with 5 nnz, 5 x 5 Duplicates check: 5 - 0 = 5 - converted COO to RSB in 1.426e-02 s (100.00 %) - analyzed arrays in 4.139e-03 s (29.03 %) - cleaned-up arrays in 0.000e+00 s (0.00 %) - deduplicated arrays in 1.192e-06 s (0.01 %) - sorted arrays in 1.975e-03 s (13.85 %) - shuffled partitions in 4.084e-03 s (28.65 %) - memory allocations took 5.960e-06 s (0.04 %) - leafs setup took 9.537e-07 s (0.01 %) - halfword conversion took 4.051e-03 s (28.41 %) -Built (5 x 5)[0xaaaae53b6820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' + converted COO to RSB in 7.276e-03 s (100.00 %) + analyzed arrays in 2.561e-03 s (35.20 %) + cleaned-up arrays in 1.192e-06 s (0.02 %) + deduplicated arrays in 9.537e-07 s (0.01 %) + sorted arrays in 6.180e-04 s (8.49 %) + shuffled partitions in 2.049e-03 s (28.16 %) + memory allocations took 5.722e-06 s (0.08 %) + leafs setup took 2.146e-06 s (0.03 %) + halfword conversion took 2.038e-03 s (28.01 %) +Built (5 x 5)[0xaaaaf2dab820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' Allocated matrix of 5 nonzeroes: -(5 x 5)[0xaaaae53b6820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(5 x 5)[0xaaaaf2dab820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -Before auto-tuning, 100 multiplications took 0.111207s. +Before auto-tuning, 100 multiplications took 0.094502s. Threads autotuning (may take more than 1.500000s)... Will use autotuning routine to sample matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=6.47545e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.00247s; avg 0.0008233s ( +/- 4.30/ 2.28 %); best 0.000788s; worst 0.0008421s; std dev. 2.502e-05 (taking best). -Reference operation time is 0.000787973 s (0.02538 Mflops) with 12 threads. -3 iterations (12 th.) took 0.002478s; avg 0.000826s ( +/- 0.37/ 0.24 %); best 0.000823s; worst 0.000828s; std dev. 2.171e-06 (taking best). -Reference operation time is 0.000823021 s (0.0243 Mflops) with 12 threads. -After 0.004993s, autotuning routine did not find a better threads count configuration. -(5 x 5)[0xaaaae53b6820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -After threads auto-tuning, 100 multiplications took 0.115203s -- effective speedup of 0.965312 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=7.82013e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.001873s; avg 0.0006243s ( +/- 4.07/ 2.34 %); best 0.0005989s; worst 0.000639s; std dev. 1.805e-05 (taking best). +Reference operation time is 0.000598907 s (0.03339 Mflops) with 12 threads. +3 iterations (12 th.) took 0.002334s; avg 0.000778s ( +/- 18.76/ 25.33 %); best 0.000632s; worst 0.0009751s; std dev. 0.0001446 (taking best). +Reference operation time is 0.000632048 s (0.03164 Mflops) with 12 threads. +After 0.004259s, autotuning routine did not find a better threads count configuration. +(5 x 5)[0xaaaaf2dab820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +After threads auto-tuning, 100 multiplications took 0.074232s -- effective speedup of 1.27306 x Matrix autotuning (may take more than 1.500000s; using 12 threads )... Will autotune matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=6.47545e-08), 12 suggested as starting thread count. -3 iterations (12 th.) took 0.002489s; avg 0.0008297s ( +/- 0.57/ 0.40 %); best 0.0008249s; worst 0.000833s; std dev. 3.46e-06 (taking best). -Reference operation time is 0.000824928 s (0.02424 Mflops) with 12 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.0008249 Mflops: 0.024) -Merge (2 -> 1 leaves) took w.c.t. of 1.311e-05s, ~3.099e-06s of computing time (of which 1.192e-06s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 83.70/200.00 %); best 6.475e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). -Reference operation time is 6.47545e-08 s (308.9 Mflops) with 12 threads. -After merge step 1: tpop: 6.475e-08 s ~Mflops: 308.859 nsubm:1 otn:12 -Applying merge (2 -> 1 leaves, 12 th.) yielded SPEEDUP of 12739.323x: 0.0008249s -> 6.475e-08s, so taking this instance. +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=7.82013e-08), 12 suggested as starting thread count. +3 iterations (12 th.) took 0.002071s; avg 0.0006904s ( +/- 14.94/ 28.64 %); best 0.0005872s; worst 0.0008881s; std dev. 0.0001399 (taking best). +Reference operation time is 0.000587225 s (0.03406 Mflops) with 12 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.0005872 Mflops: 0.034) +Merge (2 -> 1 leaves) took w.c.t. of 1.597e-05s, ~2.861e-06s of computing time (of which 0s sorting, 2.861e-06s analysis) +3 iterations (12 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 87.70/ 50.00 %); best 7.82e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 7.82013e-08 s (255.8 Mflops) with 12 threads. +After merge step 1: tpop: 7.82e-08 s ~Mflops: 255.750 nsubm:1 otn:12 +Applying merge (2 -> 1 leaves, 12 th.) yielded SPEEDUP of 7509.146x: 0.0005872s -> 7.82e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.002476s (of which 3.695e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 1.192e-06s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.002476s, equivalent to 38236.4/3.0 new/old ops (0.004917s for 2 clones -- as 75935.2/6.0 ops, or 37967.6/3.0 ops per clone), SPEEDUP of 12739.323x -Applying multi-merge (2 -> 1 leaves, 1 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 12739.323x (0.0008249s -> 6.475e-08s), will amortize in 3.0 ops by saving 0.0008249s per op. -In 1 tuning rounds (tot. 0.0075s, 0.0049s for constructor, 2 clones) obtained a SPEEDUP of 1273832.3% (1.274e+04x) (from 0.02424 to 308.9 Mflops). -After 0.007484s, autotuning routine declared speedup of 12739.3 x, when using threads count of 12. -(5 x 5)[0xaaaae53b9d70]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' -After threads auto-tuning, 100 multiplications took 0.000010s -- further speedup of 11504.7 x +A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.001911s (of which 3.815e-05s partitioning, 0s I/O); computing times: 2.861e-06s in par. loops, 0s sorting, 2.861e-06s analyzing) +Total merge + benchmarking process took 0.001911s, equivalent to 24439.0/3.3 new/old ops (0.003868s for 2 clones -- as 49463.4/6.6 ops, or 24731.7/3.3 ops per clone), SPEEDUP of 7509.146x +Applying multi-merge (2 -> 1 leaves, 1 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 7509.146x (0.0005872s -> 7.82e-08s), will amortize in 3.3 ops by saving 0.0005871s per op. +In 1 tuning rounds (tot. 0.006s, 0.0039s for constructor, 2 clones) obtained a SPEEDUP of 750814.6% (7509x) (from 0.03406 to 255.8 Mflops). +After 0.006037s, autotuning routine declared speedup of 7509.15 x, when using threads count of 12. +(5 x 5)[0xaaaaf2daed70]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +After threads auto-tuning, 100 multiplications took 0.000012s -- further speedup of 6227.02 x 0/2 0 0 -> 0 1/2 1 0 -> 5 0/2 0 3 -> 0 @@ -8341,7 +8377,7 @@ Correctly initialized the library. Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0xaaaae53b6820]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0xaaaaf2dab820]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -8492,68 +8528,61 @@ Creating 500 x 500 matrix with 62500 nonzeroes. Building a matrix with 62500 nnz, 500 x 500 Duplicates check: 62500 - 0 = 62500 - converted COO to RSB in 4.387e-02 s (100.00 %) - analyzed arrays in 8.084e-03 s (18.43 %) - cleaned-up arrays in 1.259e-04 s (0.29 %) - deduplicated arrays in 1.302e-04 s (0.30 %) - sorted arrays in 1.952e-02 s (44.49 %) - shuffled partitions in 1.332e-02 s (30.37 %) - memory allocations took 3.505e-05 s (0.08 %) - leafs setup took 9.060e-06 s (0.02 %) - halfword conversion took 2.644e-03 s (6.03 %) -Built (500 x 500)[0xaaaadfa4f2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' + converted COO to RSB in 1.593e-02 s (100.00 %) + analyzed arrays in 1.888e-03 s (11.85 %) + cleaned-up arrays in 1.631e-04 s (1.02 %) + deduplicated arrays in 1.252e-04 s (0.79 %) + sorted arrays in 8.100e-03 s (50.86 %) + shuffled partitions in 3.924e-03 s (24.64 %) + memory allocations took 3.219e-05 s (0.20 %) + leafs setup took 9.060e-06 s (0.06 %) + halfword conversion took 1.681e-03 s (10.56 %) +Built (500 x 500)[0xaaab0e6c92d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' Allocated matrix of 62500 nonzeroes: -(500 x 500)[0xaaaadfa4f2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' +(500 x 500)[0xaaab0e6c92d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' -Before auto-tuning, 100 multiplications took 0.110334s. +Before auto-tuning, 100 multiplications took 0.123914s. Threads autotuning (may take more than 1.500000s)... -Will use autotuning routine to sample matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz. +Will use autotuning routine to sample matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1195 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=3.40939e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.001596s; avg 0.0005321s ( +/- 1.51/ 2.08 %); best 0.000524s; worst 0.0005431s; std dev. 8.074e-06 (taking best). -Reference operation time is 0.000524044 s (477.1 Mflops) with 12 threads. -3 iterations (12 th.) took 0.002008s; avg 0.0006693s ( +/- 19.18/ 36.39 %); best 0.000541s; worst 0.0009129s; std dev. 0.0001723 (taking best). -Reference operation time is 0.000540972 s (462.1 Mflops) with 12 threads. -After 0.003672s, autotuning routine did not find a better threads count configuration. -(500 x 500)[0xaaaadfa4f2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' -After threads auto-tuning, 100 multiplications took 0.099618s -- effective speedup of 1.10757 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=4.39048e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.002769s; avg 0.000923s ( +/- 20.26/ 28.72 %); best 0.000736s; worst 0.001188s; std dev. 0.0001926 (taking best). +Reference operation time is 0.000735998 s (339.7 Mflops) with 12 threads. +3 iterations (12 th.) took 0.00399s; avg 0.00133s ( +/- 49.93/ 66.47 %); best 0.0006659s; worst 0.002214s; std dev. 0.0006508 (taking best). +Reference operation time is 0.000665903 s (375.4 Mflops) with 12 threads. +After 0.006832s, autotuning routine did not find a better threads count configuration. +(500 x 500)[0xaaab0e6c92d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' +After threads auto-tuning, 100 multiplications took 0.116174s -- effective speedup of 1.06662 x Matrix autotuning (may take more than 1.500000s; using 12 threads )... -Will autotune matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz. +Will autotune matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1195 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=3.40939e-08), 12 suggested as starting thread count. -3 iterations (12 th.) took 0.001539s; avg 0.000513s ( +/- 4.49/ 7.59 %); best 0.00049s; worst 0.0005519s; std dev. 2.769e-05 (taking best). -Reference operation time is 0.00048995 s (510.3 Mflops) with 12 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz (tpop: 0.00049 Mflops: 510.256) -Merge (55 -> 37 leaves) took w.c.t. of 0.001846s, ~0.006261s of computing time (of which 0.0006392s sorting, 8.106e-06s analysis) -3 iterations (12 th.) took 0.009971s; avg 0.003324s ( +/- 71.66/134.47 %); best 0.000942s; worst 0.007793s; std dev. 0.003163 (taking best). -Reference operation time is 0.000941992 s (265.4 Mflops) with 12 threads. -After merge step 1: tpop: 0.000942 s ~Mflops: 265.395 nsubm:37 otn:12 -Applying merge (55 -> 37 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.923x: 0.00049s -> 0.000942s. +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=4.39048e-08), 12 suggested as starting thread count. +3 iterations (12 th.) took 0.002597s; avg 0.0008657s ( +/- 13.38/ 8.59 %); best 0.0007498s; worst 0.0009401s; std dev. 8.303e-05 (taking best). +Reference operation time is 0.000749826 s (333.4 Mflops) with 12 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1195 bpnz (tpop: 0.0007498 Mflops: 333.410) +Merge (55 -> 37 leaves) took w.c.t. of 0.0004208s, ~0.001565s of computing time (of which 0.000277s sorting, 1.001e-05s analysis) +3 iterations (12 th.) took 0.001823s; avg 0.0006076s ( +/- 17.05/ 22.93 %); best 0.000504s; worst 0.000747s; std dev. 0.0001023 (taking best). +Reference operation time is 0.000504017 s (496 Mflops) with 12 threads. +After merge step 1: tpop: 0.000504 s ~Mflops: 496.015 nsubm:37 otn:12 +Applying merge (55 -> 37 leaves, 12 th.) yielded SPEEDUP of 1.488x: 0.0007498s -> 0.000504s, so taking this instance. +Merge (37 -> 25 leaves) took w.c.t. of 0.0004909s, ~0.000551s of computing time (of which 0.0004549s sorting, 8.106e-06s analysis) +3 iterations (12 th.) took 0.003151s; avg 0.00105s ( +/- 55.05/ 82.03 %); best 0.0004721s; worst 0.001912s; std dev. 0.000621 (taking best). +Reference operation time is 0.000472069 s (529.6 Mflops) with 12 threads. +After merge step 2: tpop: 0.0004721 s ~Mflops: 529.584 nsubm:25 otn:12 +Applying merge (37 -> 25 leaves, 12 th.) yielded SPEEDUP of 1.068x: 0.000504s -> 0.0004721s, so taking this instance. +Merge (25 -> 19 leaves) took w.c.t. of 0.0002022s, ~7.796e-05s of computing time (of which 3.6e-05s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 0.01435s; avg 0.004784s ( +/- 87.84/159.72 %); best 0.000582s; worst 0.01243s; std dev. 0.005412 (taking best). +Reference operation time is 0.00058198 s (429.6 Mflops) with 12 threads. +After merge step 3: tpop: 0.000582 s ~Mflops: 429.568 nsubm:19 otn:12 +Applying merge (25 -> 19 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.233x: 0.0004721s -> 0.000582s. Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (55 -> 37 subms) took 0.01184s (of which 0.001855s partitioning, 0s I/O); computing times: 0.006261s in par. loops, 0.0006392s sorting, 8.106e-06s analyzing) -Total merge + benchmarking process took 0.01184s, equivalent to 24.2/24.2 new/old ops (0.001539s for 1 clones -- as 3.1/3.1 ops, or 3.1/3.1 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.005305s; avg 0.001768s ( +/- 39.72/ 48.62 %); best 0.001066s; worst 0.002628s; std dev. 0.0006474 (taking best). -Reference operation time is 0.00106597 s (234.5 Mflops) with 12 threads. -Starting split (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz (tpop: 0.001066 Mflops: 234.528) -Split (55 -> 136 leaves, 75 -> 183 subms) took 0.001253s (of which: 5.96e-06s analysis, -4.829e+10s mem.mgmt); compute time: 0.0007744s overall, 0.000175s searches, 0.0005994s shuffle, 0.0002468s switch, 3.195e-05s quadrants. -3 iterations (12 th.) took 0.002855s; avg 0.0009516s ( +/- 17.20/ 25.77 %); best 0.000788s; worst 0.001197s; std dev. 0.0001766 (taking best). -Reference operation time is 0.000787973 s (317.3 Mflops) with 12 threads. -After split step 1: tpop: 0.000788 s ~Mflops: 317.270 nsubm:136 otn:12 -Applying split (55 -> 136 leaves, 12 th.) yielded SPEEDUP of 1.353x: 0.001066s -> 0.000788s, so taking this instance. -Split (136 -> 340 leaves, 183 -> 455 subms) took 0.00086s (of which: 1.216e-05s analysis, -1.216e+11s mem.mgmt); compute time: 0.001461s overall, 0.0001924s searches, 0.001268s shuffle, 0.0006599s switch, 0.0001345s quadrants. -3 iterations (12 th.) took 0.01413s; avg 0.00471s ( +/- 77.62/119.30 %); best 0.001054s; worst 0.01033s; std dev. 0.004032 (taking best). -Reference operation time is 0.00105405 s (237.2 Mflops) with 12 threads. -After split step 2: tpop: 0.001054 s ~Mflops: 237.181 nsubm:340 otn:12 -Applying split (136 -> 340 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.338x: 0.000788s -> 0.001054s. -Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 split steps (of max 6) (55 -> 340 subms) took 0.02257s (of which 0.002446s partitioning, 0s I/O); computing times: 0.002235s in par. loops, 0.0003674s sorting, 1.812e-05s analyzing) -Total split + benchmarking process took 0.02257s, equivalent to 28.6/21.2 new/old ops (0.005562s for 2 clones -- as 7.1/5.2 ops, or 3.5/2.6 ops per clone), SPEEDUP of 1.353x -Applying multi-split (55 -> 136 leaves, 1 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 1.353x (0.001066s -> 0.000788s), will amortize in 81.2 ops by saving 0.000278s per op. -In 1 tuning rounds (tot. 0.046s, 0.0071s for constructor, 3 clones) obtained a SPEEDUP of 35.3% (1.353x) (from 234.5 to 317.3 Mflops). -After 0.045774s, autotuning routine declared speedup of 1.3528 x, when using threads count of 12. -(500 x 500)[0xaaaadfb52bf0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 136, symflags:'' -After threads auto-tuning, 100 multiplications took 0.142585s -- further speedup of 0.698656 x +A total of 3 merge steps (of max 6) (55 -> 19 subms) took 0.02468s (of which 0.001149s partitioning, 0s I/O); computing times: 0.002194s in par. loops, 0.0007679s sorting, 2.313e-05s analyzing) +Total merge + benchmarking process took 0.02468s, equivalent to 52.3/32.9 new/old ops (0.005649s for 3 clones -- as 12.0/7.5 ops, or 4.0/2.5 ops per clone), SPEEDUP of 1.588x +Applying multi-merge (55 -> 25 leaves, 2 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 1.588x (0.0007498s -> 0.0004721s), will amortize in 88.9 ops by saving 0.0002778s per op. +In 1 tuning rounds (tot. 0.029s, 0.0056s for constructor, 3 clones) obtained a SPEEDUP of 58.8% (1.588x) (from 333.4 to 529.6 Mflops). +After 0.029081s, autotuning routine declared speedup of 1.58838 x, when using threads count of 12. +(500 x 500)[0xaaab0e7ccbf0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 25, symflags:'' +After threads auto-tuning, 100 multiplications took 0.094129s -- further speedup of 1.2342 x librsb timer-based profiling is not supported in this build. If you wish to have it, re-configure librsb with its support. So you can safely ignore the error you might just have seen printed out on screen. /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve Hello, RSB! @@ -8561,19 +8590,19 @@ Correctly initialized the library. Building a matrix with 7 nnz, 6 x 6 Duplicates check: 1 - 0 = 1 - converted COO to RSB in 1.393e-02 s (100.00 %) - analyzed arrays in 9.797e-03 s (70.31 %) - cleaned-up arrays in 4.053e-06 s (0.03 %) - deduplicated arrays in 9.537e-07 s (0.01 %) - sorted arrays in 9.537e-07 s (0.01 %) - shuffled partitions in 4.105e-03 s (29.46 %) - memory allocations took 1.192e-05 s (0.09 %) - leafs setup took 4.053e-06 s (0.03 %) - halfword conversion took 6.914e-06 s (0.05 %) -Built (6 x 6)[0xaaaaef1e04d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' + converted COO to RSB in 3.049e-03 s (100.00 %) + analyzed arrays in 1.992e-03 s (65.33 %) + cleaned-up arrays in 4.053e-06 s (0.13 %) + deduplicated arrays in 1.192e-06 s (0.04 %) + sorted arrays in 9.537e-07 s (0.03 %) + shuffled partitions in 1.028e-03 s (33.71 %) + memory allocations took 1.001e-05 s (0.33 %) + leafs setup took 3.099e-06 s (0.10 %) + halfword conversion took 9.060e-06 s (0.30 %) +Built (6 x 6)[0xaaab02f954d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0xaaaaef1e04d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0xaaab02f954d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -8599,55 +8628,55 @@ 1 1 Will autotune matrix: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:2.999e-08 -3 iterations (12 th.) took 2.408e-05s; avg 8.027e-06s ( +/- 99.63/185.15 %); best 2.999e-08s; worst 2.289e-05s; std dev. 1.052e-05 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 2.999e-08 Mflops: 66.682) +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3.095e-08 +3 iterations (12 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 99.70/200.00 %); best 3.095e-08s; worst 3.099e-05s; std dev. 1.461e-05 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 3.095e-08 Mflops: 64.627) Merge (1 -> 1 leaves) took w.c.t. of 0s, ~0s of computing time (of which 0s sorting, 0s analysis) -3 iterations (12 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.45/200.00 %); best 2.999e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -After merge step 1: tpop: 2.999e-08 s ~Mflops: 66.682 nsubm:1 otn:12 -Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 2.999e-08s -> 2.999e-08s, so IGNORING this instance. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.27/200.00 %); best 3.095e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +After merge step 1: tpop: 3.095e-08 s ~Mflops: 64.627 nsubm:1 otn:12 +Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 3.095e-08s -> 3.095e-08s, so IGNORING this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (1 -> 1 subms) took 9.06e-06s (of which 1.907e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) -Total merge + benchmarking process took 9.06e-06s, equivalent to 302.1/302.1 new/old ops (0.01196s for 1 clones -- as 398855.3/398855.3 ops, or 398855.3/398855.3 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +A total of 1 merge steps (of max 6) (1 -> 1 subms) took 9.775e-06s (of which 2.861e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 9.775e-06s, equivalent to 315.9/315.9 new/old ops (0.002706s for 1 clones -- as 87434.5/87434.5 ops, or 87434.5/87434.5 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 98.20/200.00 %); best 2.999e-08s; worst 5.007e-06s; std dev. 2.36e-06 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 2.999e-08 Mflops: 66.682) -Split (1 -> 1 leaves, 1 -> 1 subms) took 1.788e-05s (of which: 3.099e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.57/200.00 %); best 2.999e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -After split step 1: tpop: 2.999e-08 s ~Mflops: 66.682 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 2.999e-08s -> 2.999e-08s, so IGNORING this instance. +3 iterations (12 th.) took 6.914e-06s; avg 2.305e-06s ( +/- 98.66/200.00 %); best 3.095e-08s; worst 6.914e-06s; std dev. 3.259e-06 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 3.095e-08 Mflops: 64.627) +Split (1 -> 1 leaves, 1 -> 1 subms) took 2.503e-05s (of which: 4.053e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.095e-08s; worst 0s; std dev. 0 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +After split step 1: tpop: 3.095e-08 s ~Mflops: 64.627 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 3.095e-08s -> 3.095e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 1.907e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.21/200.00 %); best 3.095e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +After split step 2: tpop: 3.095e-08 s ~Mflops: 64.627 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00000x): 3.095e-08s -> 3.095e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 5.007e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 95.67/200.00 %); best 3.095e-08s; worst 2.146e-06s; std dev. 1.012e-06 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +After split step 3: tpop: 3.095e-08 s ~Mflops: 64.627 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=1.00000x): 3.095e-08s -> 3.095e-08s, so IGNORING this instance. Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 96.86/100.00 %); best 2.999e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -After split step 2: tpop: 2.999e-08 s ~Mflops: 66.682 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00000x): 2.999e-08s -> 2.999e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 4.053e-06s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.57/200.00 %); best 2.999e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -After split step 3: tpop: 2.999e-08 s ~Mflops: 66.682 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=1.00000x): 2.999e-08s -> 2.999e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 1.907e-06s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.57/200.00 %); best 2.999e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -After split step 4: tpop: 2.999e-08 s ~Mflops: 66.682 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00000x): 2.999e-08s -> 2.999e-08s, so IGNORING this instance. +3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.095e-08s; worst 0s; std dev. 0 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +After split step 4: tpop: 3.095e-08 s ~Mflops: 64.627 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00000x): 3.095e-08s -> 3.095e-08s, so IGNORING this instance. Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 2.999e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -After split step 5: tpop: 2.999e-08 s ~Mflops: 66.682 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00000x): 2.999e-08s -> 2.999e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 1.907e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 2.999e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 2.99931e-08 s (66.68 Mflops) with 12 threads. -After split step 6: tpop: 2.999e-08 s ~Mflops: 66.682 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00000x): 2.999e-08s -> 2.999e-08s, so IGNORING this instance. -A total of 6 split steps (of max 6) (1 -> 1 subms) took 0.0002799s (of which 0.000246s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 5.007e-06s analyzing) -Total split + benchmarking process took 0.0002799s, equivalent to 9332.3/9332.3 new/old ops (0.01199s for 1 clones -- as 399793.3/399793.3 ops, or 399793.3/399793.3 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.024s, 0.024s for constructor, 2 clones) obtained NO speedup (best stays 66.68 Mflops). +3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.095e-08s; worst 0s; std dev. 0 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +After split step 5: tpop: 3.095e-08 s ~Mflops: 64.627 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00000x): 3.095e-08s -> 3.095e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 1.192e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.27/200.00 %); best 3.095e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 3.09467e-08 s (64.63 Mflops) with 12 threads. +After split step 6: tpop: 3.095e-08 s ~Mflops: 64.627 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00000x): 3.095e-08s -> 3.095e-08s, so IGNORING this instance. +A total of 6 split steps (of max 6) (1 -> 1 subms) took 0.0003672s (of which 5.507e-05s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 4.053e-06s analyzing) +Total split + benchmarking process took 0.0003672s, equivalent to 11864.4/11864.4 new/old ops (0.002196s for 1 clones -- as 70963.0/70963.0 ops, or 70963.0/70963.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.0054s, 0.0049s for constructor, 2 clones) obtained NO speedup (best stays 64.63 Mflops). Backsolving we should get a unitary vector: %%MatrixMarket matrix array real general @@ -8682,196 +8711,184 @@ /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran Building a matrix with 210 nnz, 20 x 20 Duplicates check: 210 - 0 = 210 - converted COO to RSB in 2.528e-02 s (100.00 %) - analyzed arrays in 1.264e-02 s (50.00 %) - cleaned-up arrays in 2.146e-06 s (0.01 %) - deduplicated arrays in 2.861e-06 s (0.01 %) - sorted arrays in 4.570e-03 s (18.08 %) - shuffled partitions in 4.387e-03 s (17.36 %) - memory allocations took 3.386e-05 s (0.13 %) - leafs setup took 7.868e-06 s (0.03 %) - halfword conversion took 3.619e-03 s (14.32 %) -Built (20 x 20)[0xaaab0aaf09f0]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'LS' + converted COO to RSB in 9.237e-03 s (100.00 %) + analyzed arrays in 3.627e-03 s (39.26 %) + cleaned-up arrays in 2.146e-06 s (0.02 %) + deduplicated arrays in 3.099e-06 s (0.03 %) + sorted arrays in 1.571e-03 s (17.01 %) + shuffled partitions in 2.118e-03 s (22.93 %) + memory allocations took 3.290e-05 s (0.36 %) + leafs setup took 5.960e-06 s (0.06 %) + halfword conversion took 1.836e-03 s (19.88 %) +Built (20 x 20)[0xaaaae21979f0]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'LS' Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:4.619e-08 -Starting autotuning (16 x 4.61936e-08 s stages, transA=N, nrhs=1, timer gran.=4.61936e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.006779s; avg 0.00226s ( +/- 44.29/ 50.60 %); best 0.001259s; worst 0.003403s; std dev. 0.0008812 (taking best). -Reference operation time is 0.00125885 s (0.6673 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.001259 Mflops: 0.667) -Merge (22 -> 16 leaves) took w.c.t. of 0.00088s, ~0.0002069s of computing time (of which 2.146e-06s sorting, 6.914e-06s analysis) -3 iterations (12 th.) took 0.007997s; avg 0.002666s ( +/- 16.64/ 32.46 %); best 0.002222s; worst 0.003531s; std dev. 0.0006119 (taking best). -Reference operation time is 0.00222206 s (0.378 Mflops) with 12 threads. -After merge step 1: tpop: 0.002222 s ~Mflops: 0.378 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.765x: 0.001259s -> 0.002222s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (22 -> 16 subms) took 0.008899s (of which 0.000885s partitioning, 0s I/O); computing times: 0.0002069s in par. loops, 2.146e-06s sorting, 6.914e-06s analyzing) -Total merge + benchmarking process took 0.008899s, equivalent to 7.1/7.1 new/old ops (0.005387s for 1 clones -- as 4.3/4.3 ops, or 4.3/4.3 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.01273s; avg 0.004242s ( +/- 7.29/ 7.71 %); best 0.003933s; worst 0.004569s; std dev. 0.00026 (taking best). -Reference operation time is 0.00393295 s (0.2136 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.003933 Mflops: 0.214) -Split (22 -> 51 leaves, 30 -> 70 subms) took 0.005083s (of which: 5.96e-06s analysis, -1.968e+10s mem.mgmt); compute time: 0.00592s overall, 5.96e-06s searches, 0.005914s shuffle, 0.004922s switch, 5.698e-05s quadrants. -3 iterations (12 th.) took 0.008238s; avg 0.002746s ( +/- 28.92/ 25.75 %); best 0.001952s; worst 0.003453s; std dev. 0.0006159 (taking best). -Reference operation time is 0.00195193 s (0.4303 Mflops) with 12 threads. -After split step 1: tpop: 0.001952 s ~Mflops: 0.430 nsubm:51 otn:12 -Applying split (22 -> 51 leaves, 12 th.) yielded SPEEDUP of 2.015x: 0.003933s -> 0.001952s, so taking this instance. -Split (51 -> 122 leaves, 70 -> 166 subms) took 0.002577s (of which: 1.097e-05s analysis, -4.472e+10s mem.mgmt); compute time: 0.0009537s overall, 9.298e-06s searches, 0.0009444s shuffle, 0.0005627s switch, 7.796e-05s quadrants. -3 iterations (12 th.) took 0.02493s; avg 0.00831s ( +/- 4.22/ 6.09 %); best 0.007959s; worst 0.008816s; std dev. 0.0003668 (taking best). -Reference operation time is 0.00795889 s (0.1055 Mflops) with 12 threads. -After split step 2: tpop: 0.007959 s ~Mflops: 0.106 nsubm:122 otn:12 -Applying split (51 -> 122 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 4.077x: 0.001952s -> 0.007959s. -Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 split steps (of max 6) (22 -> 122 subms) took 0.05164s (of which 0.007828s partitioning, 0s I/O); computing times: 0.006874s in par. loops, 1.526e-05s sorting, 1.693e-05s analyzing) -Total split + benchmarking process took 0.05164s, equivalent to 26.5/13.1 new/old ops (0.0198s for 2 clones -- as 10.1/5.0 ops, or 5.1/2.5 ops per clone), SPEEDUP of 2.015x -Applying multi-split (22 -> 51 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 2.015x (0.003933s -> 0.001952s), will amortize in 26.1 ops by saving 0.001981s per op. -In 1 tuning rounds (tot. 0.095s, 0.025s for constructor, 3 clones) obtained a SPEEDUP of 101.5% (2.015x) (from 0.2136 to 0.4303 Mflops). +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3.76e-08 +Starting autotuning (16 x 3.75986e-08 s stages, transA=N, nrhs=1, timer gran.=3.75986e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.02205s; avg 0.007348s ( +/- 81.64/128.20 %); best 0.001349s; worst 0.01677s; std dev. 0.006744 (taking best). +Reference operation time is 0.00134921 s (0.6226 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.001349 Mflops: 0.623) +Merge (22 -> 16 leaves) took w.c.t. of 0.001435s, ~6.723e-05s of computing time (of which 2.146e-06s sorting, 6.914e-06s analysis) +3 iterations (12 th.) took 0.006415s; avg 0.002138s ( +/- 30.46/ 55.78 %); best 0.001487s; worst 0.003331s; std dev. 0.0008445 (taking best). +Reference operation time is 0.00148702 s (0.5649 Mflops) with 12 threads. +After merge step 1: tpop: 0.001487 s ~Mflops: 0.565 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.102x: 0.001349s -> 0.001487s. +Merge (16 -> 10 leaves) took w.c.t. of 7.105e-05s, ~1.502e-05s of computing time (of which 1.907e-06s sorting, 8.106e-06s analysis) +3 iterations (12 th.) took 0.004734s; avg 0.001578s ( +/- 23.70/ 40.38 %); best 0.001204s; worst 0.002215s; std dev. 0.0004528 (taking best). +Reference operation time is 0.00120401 s (0.6977 Mflops) with 12 threads. +After merge step 2: tpop: 0.001204 s ~Mflops: 0.698 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.121x: 0.001349s -> 0.001204s, so taking this instance. +Merge (10 -> 8 leaves) took w.c.t. of 1.407e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 0.0033s; avg 0.0011s ( +/- 8.45/ 16.46 %); best 0.001007s; worst 0.001281s; std dev. 0.000128 (taking best). +Reference operation time is 0.00100708 s (0.8341 Mflops) with 12 threads. +After merge step 3: tpop: 0.001007 s ~Mflops: 0.834 nsubm:8 otn:12 +Applying merge (10 -> 8 leaves, 12 th.) yielded SPEEDUP of 1.196x: 0.001204s -> 0.001007s, so taking this instance. +Merge (8 -> 6 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 0.004177s; avg 0.001392s ( +/- 35.58/ 54.27 %); best 0.0008969s; worst 0.002148s; std dev. 0.0005429 (taking best). +Reference operation time is 0.000896931 s (0.9365 Mflops) with 12 threads. +After merge step 4: tpop: 0.0008969 s ~Mflops: 0.937 nsubm:6 otn:12 +Applying merge (8 -> 6 leaves, 12 th.) yielded SPEEDUP of 1.123x: 0.001007s -> 0.0008969s, so taking this instance. +Merge (6 -> 3 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 0.002259s; avg 0.0007529s ( +/- 38.63/ 26.28 %); best 0.0004621s; worst 0.0009508s; std dev. 0.0002101 (taking best). +Reference operation time is 0.000462055 s (1.818 Mflops) with 12 threads. +After merge step 5: tpop: 0.0004621 s ~Mflops: 1.818 nsubm:3 otn:12 +Applying merge (6 -> 3 leaves, 12 th.) yielded SPEEDUP of 1.941x: 0.0008969s -> 0.0004621s, so taking this instance. +Merge (3 -> 1 leaves) took w.c.t. of 2.098e-05s, ~8.821e-06s of computing time (of which 1.907e-06s sorting, 5.96e-06s analysis) +3 iterations (12 th.) took 5.96e-06s; avg 1.987e-06s ( +/- 98.11/152.00 %); best 3.76e-08s; worst 5.007e-06s; std dev. 2.171e-06 (taking best). +Reference operation time is 3.75986e-08 s (2.234e+04 Mflops) with 12 threads. +After merge step 6: tpop: 3.76e-08 s ~Mflops: 22341.251 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 12289.157x: 0.0004621s -> 3.76e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 6 merge steps (of max 6) (22 -> 1 subms) took 0.03743s (of which 0.001693s partitioning, 0s I/O); computing times: 0.0001042s in par. loops, 8.821e-06s sorting, 2.789e-05s analyzing) +Total merge + benchmarking process took 0.03743s, equivalent to 995542.2/27.7 new/old ops (0.01783s for 6 clones -- as 474140.8/13.2 ops, or 79023.5/2.2 ops per clone), SPEEDUP of 35884.591x +Applying multi-merge (22 -> 1 leaves, 6 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 35884.591x (0.001349s -> 3.76e-08s), will amortize in 27.7 ops by saving 0.001349s per op. +In 1 tuning rounds (tot. 0.063s, 0.018s for constructor, 6 clones) obtained a SPEEDUP of 3588359.1% (3.588e+04x) (from 0.6226 to 2.234e+04 Mflops). autotuner chose 12 threads -Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 70 subms, 51 lsubms, 4.4571 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:4.619e-08 -Starting autotuning (16 x 4.61936e-08 s stages, transA=N, nrhs=1, timer gran.=4.61936e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.02317s; avg 0.007724s ( +/- 33.53/ 23.62 %); best 0.005134s; worst 0.009548s; std dev. 0.001881 (taking best). -~ 12 threads: 0.005134s (0.16 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.01103s; avg 0.003676s ( +/- 18.69/ 31.60 %); best 0.002989s; worst 0.004838s; std dev. 0.000826 (taking best). - 11 threads: 0.002989s (0.28 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.008384s; avg 0.002795s ( +/- 35.66/ 48.89 %); best 0.001798s; worst 0.004161s; std dev. 0.0009994 (taking best). - 10 threads: 0.001798s (0.47 Mflops) (0/2 degradations so far) - -3 iterations (9 th.) took 0.007771s; avg 0.00259s ( +/- 26.41/ 40.63 %); best 0.001906s; worst 0.003643s; std dev. 0.0007553 (taking best). - 9 threads: 0.001906s (0.44 Mflops) (1/2 degradations so far) - -3 iterations (8 th.) took 0.006194s; avg 0.002065s ( +/- 30.01/ 30.63 %); best 0.001445s; worst 0.002697s; std dev. 0.0005112 (taking best). - 8 threads: 0.001445s (0.58 Mflops) (0/2 degradations so far) - -3 iterations (7 th.) took 0.004317s; avg 0.001439s ( +/- 4.17/ 4.86 %); best 0.001379s; worst 0.001509s; std dev. 5.351e-05 (taking best). - 7 threads: 0.001379s (0.61 Mflops) (0/2 degradations so far) - -3 iterations (6 th.) took 0.00763s; avg 0.002543s ( +/- 45.39/ 45.52 %); best 0.001389s; worst 0.003701s; std dev. 0.0009439 (taking best). - 6 threads: 0.001389s (0.6 Mflops) (1/2 degradations so far) - -3 iterations (5 th.) took 0.007267s; avg 0.002422s ( +/- 15.37/ 14.81 %); best 0.00205s; worst 0.002781s; std dev. 0.0002987 (taking best). - 5 threads: 0.00205s (0.41 Mflops) (2/2 degradations so far) - -Best threads choice is 7; starting threads were 12; max speed gap is 3.7x; search took 0.076s. -Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 70 subms, 51 lsubms, 4.4571 bpnz (tpop: 0.001379 Mflops: 0.609) -Merge (51 -> 36 leaves) took w.c.t. of 0.0007629s, ~0.0002737s of computing time (of which 5.007e-06s sorting, 7.153e-06s analysis) -3 iterations (12 th.) took 0.02562s; avg 0.008539s ( +/- 24.99/ 41.05 %); best 0.006405s; worst 0.01205s; std dev. 0.002498 (taking best). -~ 12 threads: 0.006405s (0.13 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.01076s; avg 0.003587s ( +/- 48.15/ 37.55 %); best 0.00186s; worst 0.004934s; std dev. 0.001283 (taking best). - 11 threads: 0.00186s (0.45 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.006735s; avg 0.002245s ( +/- 25.26/ 28.65 %); best 0.001678s; worst 0.002888s; std dev. 0.000497 (taking best). - 10 threads: 0.001678s (0.5 Mflops) (0/2 degradations so far) - -3 iterations (9 th.) took 0.008284s; avg 0.002761s ( +/- 21.59/ 26.02 %); best 0.002165s; worst 0.00348s; std dev. 0.0005437 (taking best). - 9 threads: 0.002165s (0.39 Mflops) (1/2 degradations so far) - -3 iterations (8 th.) took 0.005858s; avg 0.001953s ( +/- 11.81/ 18.45 %); best 0.001722s; worst 0.002313s; std dev. 0.000258 (taking best). - 8 threads: 0.001722s (0.49 Mflops) (2/2 degradations so far) - -Best threads choice is 10; starting threads were 12; max speed gap is 3.8x; search took 0.057s. -After merge step 1: tpop: 0.001678 s ~Mflops: 0.501 nsubm:36 otn:10 -Applying merge (51 -> 36 leaves, 10 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.217x: 0.001379s -> 0.001678s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (51 -> 36 subms) took 0.0581s (of which 0.000767s partitioning, 0s I/O); computing times: 0.0002737s in par. loops, 5.007e-06s sorting, 7.153e-06s analyzing) -Total merge + benchmarking process took 0.0581s, equivalent to 42.1/42.1 new/old ops (0.01356s for 1 clones -- as 9.8/9.8 ops, or 9.8/9.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz. +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3.76e-08 +Starting autotuning (16 x 3.75986e-08 s stages, transA=N, nrhs=1, timer gran.=3.75986e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 7.153e-06s; avg 2.384e-06s ( +/- 98.42/160.00 %); best 3.76e-08s; worst 6.199e-06s; std dev. 2.725e-06 (taking best). +~ 12 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 11 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 10 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 9 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 8 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 7 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 6 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 5 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 4 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 94.74/ 66.67 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). + 3 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 94.74/ 66.67 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). + 2 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.54/200.00 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 1 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 7.9e-05s. +Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz (tpop: 3.76e-08 Mflops: 22341.251) +Merge (1 -> 1 leaves) took w.c.t. of 0s, ~0s of computing time (of which 0s sorting, 0s analysis) +3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 94.74/ 66.67 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). +~ 12 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.54/200.00 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 11 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.54/200.00 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 10 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 9 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 96.06/100.00 %); best 3.76e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). + 8 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 7 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 6 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 5 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 4 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 3 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 2 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 1 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 0.00024s. +After merge step 1: tpop: 3.76e-08 s ~Mflops: 22341.251 nsubm:1 otn:12 +Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 3.76e-08s -> 3.76e-08s, so IGNORING this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 1 merge steps (of max 6) (1 -> 1 subms) took 0.000258s (of which 2.861e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 0.000258s, equivalent to 6861.1/6861.1 new/old ops (0.002483s for 1 clones -- as 66036.8/66036.8 ops, or 66036.8/66036.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.008676s; avg 0.002892s ( +/- 37.41/ 67.49 %); best 0.00181s; worst 0.004844s; std dev. 0.001383 (taking best). -~ 12 threads: 0.00181s (0.46 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.005461s; avg 0.00182s ( +/- 34.56/ 46.94 %); best 0.001191s; worst 0.002675s; std dev. 0.0006263 (taking best). - 11 threads: 0.001191s (0.71 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.005194s; avg 0.001731s ( +/- 22.61/ 42.61 %); best 0.00134s; worst 0.002469s; std dev. 0.000522 (taking best). - 10 threads: 0.00134s (0.63 Mflops) (1/2 degradations so far) - -3 iterations (9 th.) took 0.003793s; avg 0.001264s ( +/- 3.90/ 5.11 %); best 0.001215s; worst 0.001329s; std dev. 4.776e-05 (taking best). - 9 threads: 0.001215s (0.69 Mflops) (2/2 degradations so far) - -Best threads choice is 11; starting threads were 12; max speed gap is 1.5x; search took 0.023s. -Starting split (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 70 subms, 51 lsubms, 4.4571 bpnz (tpop: 0.001191 Mflops: 0.705) -Split (51 -> 122 leaves, 70 -> 166 subms) took 0.002592s (of which: 5.007e-06s analysis, -4.472e+10s mem.mgmt); compute time: 0.0001786s overall, 5.96e-06s searches, 0.0001726s shuffle, 4.792e-05s switch, 3.672e-05s quadrants. -3 iterations (12 th.) took 0.005837s; avg 0.001946s ( +/- 7.85/ 13.02 %); best 0.001793s; worst 0.002199s; std dev. 0.0001804 (taking best). -~ 12 threads: 0.001793s (0.47 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.01346s; avg 0.004487s ( +/- 70.47/ 95.00 %); best 0.001325s; worst 0.008749s; std dev. 0.003129 (taking best). - 11 threads: 0.001325s (0.63 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.007265s; avg 0.002422s ( +/- 60.15/ 36.89 %); best 0.0009651s; worst 0.003315s; std dev. 0.001039 (taking best). - 10 threads: 0.0009651s (0.87 Mflops) (0/2 degradations so far) - -3 iterations (9 th.) took 0.005662s; avg 0.001887s ( +/- 10.61/ 14.97 %); best 0.001687s; worst 0.00217s; std dev. 0.0002055 (taking best). - 9 threads: 0.001687s (0.5 Mflops) (1/2 degradations so far) - -3 iterations (8 th.) took 0.005504s; avg 0.001835s ( +/- 28.23/ 28.27 %); best 0.001317s; worst 0.002353s; std dev. 0.0004231 (taking best). - 8 threads: 0.001317s (0.64 Mflops) (2/2 degradations so far) - -Best threads choice is 10; starting threads were 12; max speed gap is 1.9x; search took 0.038s. -After split step 1: tpop: 0.0009651 s ~Mflops: 0.870 nsubm:122 otn:10 -Applying split (51 -> 122 leaves, 10 th.) yielded SPEEDUP of 1.234x: 0.001191s -> 0.0009651s, so taking this instance. -Split (122 -> 146 leaves, 166 -> 198 subms) took 0.001553s (of which: 1.121e-05s analysis, -1.431e+10s mem.mgmt); compute time: 6.151e-05s overall, 9.537e-07s searches, 6.056e-05s shuffle, 1.788e-05s switch, 1.216e-05s quadrants. -3 iterations (12 th.) took 0.004249s; avg 0.001416s ( +/- 4.05/ 3.36 %); best 0.001359s; worst 0.001464s; std dev. 4.337e-05 (taking best). -~ 12 threads: 0.001359s (0.62 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.00461s; avg 0.001537s ( +/- 46.64/ 52.61 %); best 0.0008199s; worst 0.002345s; std dev. 0.000626 (taking best). - 11 threads: 0.0008199s (1 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.003253s; avg 0.001084s ( +/- 18.76/ 15.92 %); best 0.000881s; worst 0.001257s; std dev. 0.000155 (taking best). - 10 threads: 0.000881s (0.95 Mflops) (1/2 degradations so far) - -3 iterations (9 th.) took 0.006478s; avg 0.002159s ( +/- 46.46/ 28.19 %); best 0.001156s; worst 0.002768s; std dev. 0.0007148 (taking best). - 9 threads: 0.001156s (0.73 Mflops) (2/2 degradations so far) - -Best threads choice is 11; starting threads were 12; max speed gap is 1.7x; search took 0.019s. -After split step 2: tpop: 0.0008199 s ~Mflops: 1.024 nsubm:146 otn:11 -Applying split (122 -> 146 leaves, 11 th.) yielded SPEEDUP of 1.177x: 0.0009651s -> 0.0008199s, so taking this instance. -Split (146 -> 146 leaves, 198 -> 198 subms) took 0.000689s (of which: 1.502e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0.003549s; avg 0.001183s ( +/- 18.76/ 19.53 %); best 0.0009611s; worst 0.001414s; std dev. 0.000185 (taking best). -~ 12 threads: 0.0009611s (0.87 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.004498s; avg 0.001499s ( +/- 44.98/ 34.38 %); best 0.0008249s; worst 0.002015s; std dev. 0.0004986 (taking best). - 11 threads: 0.0008249s (1 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.003659s; avg 0.00122s ( +/- 31.21/ 24.46 %); best 0.000839s; worst 0.001518s; std dev. 0.0002833 (taking best). - 10 threads: 0.000839s (1 Mflops) (1/2 degradations so far) - -3 iterations (9 th.) took 0.003236s; avg 0.001079s ( +/- 22.88/ 42.22 %); best 0.0008318s; worst 0.001534s; std dev. 0.0003224 (taking best). - 9 threads: 0.0008318s (1 Mflops) (2/2 degradations so far) - -Best threads choice is 11; starting threads were 12; max speed gap is 1.2x; search took 0.015s. -After split step 3: tpop: 0.0008249 s ~Mflops: 1.018 nsubm:146 otn:11 -Applying split (146 -> 146 leaves, 11 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99393x): 0.0008199s -> 0.0008249s, so IGNORING this instance. -Split (146 -> 146 leaves, 198 -> 198 subms) took 0.001202s (of which: 1.407e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0.00272s; avg 0.0009067s ( +/- 16.17/ 19.67 %); best 0.0007601s; worst 0.001085s; std dev. 0.0001345 (taking best). -~ 12 threads: 0.0007601s (1.1 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.00299s; avg 0.0009967s ( +/- 20.34/ 12.38 %); best 0.0007939s; worst 0.00112s; std dev. 0.0001445 (taking best). - 11 threads: 0.0007939s (1.1 Mflops) (1/2 degradations so far) - -3 iterations (10 th.) took 0.002923s; avg 0.0009743s ( +/- 21.28/ 21.62 %); best 0.000767s; worst 0.001185s; std dev. 0.0001706 (taking best). - 10 threads: 0.000767s (1.1 Mflops) (2/2 degradations so far) - -Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 0.0087s. -After split step 4: tpop: 0.0007601 s ~Mflops: 1.105 nsubm:146 otn:12 -Applying split (146 -> 146 leaves, 12 th.) yielded SPEEDUP of 1.079x: 0.0008199s -> 0.0007601s, so taking this instance. -Split (146 -> 146 leaves, 198 -> 198 subms) took 0.001075s (of which: 1.192e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0.005139s; avg 0.001713s ( +/- 19.38/ 26.51 %); best 0.001381s; worst 0.002167s; std dev. 0.0003323 (taking best). -~ 12 threads: 0.001381s (0.61 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.01038s; avg 0.003461s ( +/- 78.85/ 69.01 %); best 0.0007319s; worst 0.005849s; std dev. 0.002103 (taking best). - 11 threads: 0.0007319s (1.1 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.003507s; avg 0.001169s ( +/- 27.03/ 50.29 %); best 0.0008531s; worst 0.001757s; std dev. 0.0004161 (taking best). - 10 threads: 0.0008531s (0.98 Mflops) (1/2 degradations so far) - -3 iterations (9 th.) took 0.002758s; avg 0.0009193s ( +/- 11.77/ 14.86 %); best 0.0008111s; worst 0.001056s; std dev. 0.000102 (taking best). - 9 threads: 0.0008111s (1 Mflops) (2/2 degradations so far) - -Best threads choice is 11; starting threads were 12; max speed gap is 1.9x; search took 0.022s. -After split step 5: tpop: 0.0007319 s ~Mflops: 1.148 nsubm:146 otn:11 -Applying split (146 -> 146 leaves, 11 th.) yielded SPEEDUP of 1.038x: 0.0007601s -> 0.0007319s, so taking this instance. -Split (146 -> 146 leaves, 198 -> 198 subms) took 0.001282s (of which: 1.097e-05s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0.006352s; avg 0.002117s ( +/- 59.48/ 57.83 %); best 0.0008581s; worst 0.003342s; std dev. 0.001014 (taking best). -~ 12 threads: 0.0008581s (0.98 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.003214s; avg 0.001071s ( +/- 3.48/ 5.67 %); best 0.001034s; worst 0.001132s; std dev. 4.33e-05 (taking best). - 11 threads: 0.001034s (0.81 Mflops) (1/2 degradations so far) - -3 iterations (10 th.) took 0.008964s; avg 0.002988s ( +/- 70.95/108.30 %); best 0.0008681s; worst 0.006224s; std dev. 0.002325 (taking best). - 10 threads: 0.0008681s (0.97 Mflops) (2/2 degradations so far) - -Best threads choice is 12; starting threads were 12; max speed gap is 1.2x; search took 0.019s. -After split step 6: tpop: 0.0008581 s ~Mflops: 0.979 nsubm:146 otn:12 -Applying split (146 -> 146 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.172x: 0.0007319s -> 0.0008581s. -A total of 6 split steps (of max 6) (51 -> 146 subms) took 0.1388s (of which 0.009227s partitioning, 0s I/O); computing times: 0.0002401s in par. loops, 6.914e-06s sorting, 6.819e-05s analyzing) -Total split + benchmarking process took 0.1388s, equivalent to 189.6/116.5 new/old ops (0.01248s for 5 clones -- as 17.0/10.5 ops, or 3.4/2.1 ops per clone), SPEEDUP of 1.627x -Applying multi-split (51 -> 146 leaves, 5 steps, 11 -> 11 th.sp.) yielded SPEEDUP of 1.627x (0.001191s -> 0.0007319s), will amortize in 302.3 ops by saving 0.0004592s per op. -In 1 tuning rounds (tot. 0.31s, 0.026s for constructor, 6 clones) obtained a SPEEDUP of 62.7% (1.627x) (from 0.7052 to 1.148 Mflops). +3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 94.74/ 66.67 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). +~ 12 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 11 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 10 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 9 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 8 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.09/ 50.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 7 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 6 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 96.36/107.69 %); best 3.76e-08s; worst 2.146e-06s; std dev. 8.778e-07 (taking best). + 5 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.17/200.00 %); best 3.76e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 4 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.54/200.00 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 3 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 94.74/ 66.67 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). + 2 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 94.74/ 66.67 %); best 3.76e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). + 1 threads: 3.76e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 0.00018s. +Starting split (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz (tpop: 3.76e-08 Mflops: 22341.251) +Split (1 -> 3 leaves, 1 -> 4 subms) took 3.6e-05s (of which: 3.099e-06s analysis, -1.754e+09s mem.mgmt); compute time: 1.502e-05s overall, 3.099e-06s searches, 1.192e-05s shuffle, 3.099e-06s switch, 0s quadrants. +3 iterations (12 th.) took 0.003212s; avg 0.001071s ( +/- 25.45/ 25.42 %); best 0.0007982s; worst 0.001343s; std dev. 0.0002223 (taking best). +~ 12 threads: 0.0007982s (1.1 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 0.002051s; avg 0.0006836s ( +/- 16.93/ 13.24 %); best 0.0005679s; worst 0.0007741s; std dev. 8.606e-05 (taking best). + 11 threads: 0.0005679s (1.5 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 0.003215s; avg 0.001072s ( +/- 30.75/ 33.88 %); best 0.0007422s; worst 0.001435s; std dev. 0.0002838 (taking best). + 10 threads: 0.0007422s (1.1 Mflops) (1/2 degradations so far) - +3 iterations (9 th.) took 0.002396s; avg 0.0007987s ( +/- 20.60/ 18.42 %); best 0.0006342s; worst 0.0009458s; std dev. 0.0001278 (taking best). + 9 threads: 0.0006342s (1.3 Mflops) (2/2 degradations so far) - +Best threads choice is 11; starting threads were 12; max speed gap is 1.4x; search took 0.011s. +After split step 1: tpop: 0.0005679 s ~Mflops: 1.479 nsubm:3 otn:11 +Applying split (1 -> 3 leaves, 11 th.) yielded SLOWDOWN (1th of 3 tolerable) of 15104.629x: 3.76e-08s -> 0.0005679s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 split steps (of max 6) (1 -> 3 subms) took 0.01102s (of which 4.721e-05s partitioning, 0s I/O); computing times: 1.502e-05s in par. loops, 3.099e-06s sorting, 3.099e-06s analyzing) +Total split + benchmarking process took 0.01102s, equivalent to 293202.3/293202.3 new/old ops (0.001879s for 1 clones -- as 49974.6/49974.6 ops, or 49974.6/49974.6 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.016s, 0.0044s for constructor, 2 clones) obtained NO speedup (best stays 2.234e+04 Mflops). check results are ok Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 3.047e-03 s (100.00 %) - analyzed arrays in 1.411e-03 s (46.31 %) - cleaned-up arrays in 9.537e-07 s (0.03 %) - deduplicated arrays in 9.537e-07 s (0.03 %) - sorted arrays in 6.001e-04 s (19.69 %) - shuffled partitions in 1.030e-03 s (33.80 %) - memory allocations took 1.907e-06 s (0.06 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 0.000e+00 s (0.00 %) -Built (6 x 6)[0xaaab0aaf6740]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' + converted COO to RSB in 2.280e-03 s (100.00 %) + analyzed arrays in 8.199e-04 s (35.96 %) + cleaned-up arrays in 9.537e-07 s (0.04 %) + deduplicated arrays in 9.537e-07 s (0.04 %) + sorted arrays in 6.511e-04 s (28.56 %) + shuffled partitions in 7.958e-04 s (34.91 %) + memory allocations took 7.153e-06 s (0.31 %) + leafs setup took 2.146e-06 s (0.09 %) + halfword conversion took 9.537e-07 s (0.04 %) +Built (6 x 6)[0xaaaae219f4f0]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' Read matrix pd.mtx 6 x 6 : 36 Matrix has no symmetry Using NRHS=4 -Repeated USMV took 0.1841E-03 s -A single USMM took 0.6199E-05 s -USMM-to-USMV speed ratio is is 29.69 x +Repeated USMV took 0.2420E-03 s +A single USMM took 0.5960E-05 s +USMM-to-USMV speed ratio is is 40.60 x Call auto-tuning routine.. Repeat measurement. -Tuned USMM took 0.2146E-05 s -Tuned-to-untuned speed ratio is is 2.889 x +Tuned USMM took 0.5007E-05 s +Tuned-to-untuned speed ratio is is 1.190 x FAILED: 0 PASSED: 2 /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran_rsb_fi @@ -8920,193 +8937,218 @@ Loading matrix from file "/build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx". Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 1.713e-02 s (100.00 %) - analyzed arrays in 2.349e-03 s (13.71 %) - cleaned-up arrays in 6.914e-06 s (0.04 %) - deduplicated arrays in 2.146e-06 s (0.01 %) - sorted arrays in 6.368e-03 s (37.17 %) - shuffled partitions in 4.783e-03 s (27.92 %) - memory allocations took 1.335e-05 s (0.08 %) - leafs setup took 6.914e-06 s (0.04 %) - halfword conversion took 3.591e-03 s (20.96 %) -Built (6 x 6)[0xaaab10bc2a20]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + converted COO to RSB in 9.409e-03 s (100.00 %) + analyzed arrays in 2.539e-03 s (26.98 %) + cleaned-up arrays in 9.060e-06 s (0.10 %) + deduplicated arrays in 5.007e-06 s (0.05 %) + sorted arrays in 1.477e-03 s (15.70 %) + shuffled partitions in 2.087e-03 s (22.18 %) + memory allocations took 3.195e-05 s (0.34 %) + leafs setup took 7.868e-06 s (0.08 %) + halfword conversion took 3.216e-03 s (34.18 %) +Built (6 x 6)[0xaaab113f1a20]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Considering D clone. Base matrix: -(6 x 6)[0xaaab10bc6aa0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(6 x 6)[0xaaab113f5aa0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' -Will use autotuning routine to sample matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. +Will use autotuning routine to sample matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.00484s; avg 0.001613s ( +/- 45.84/ 66.12 %); best 0.0008738s; worst 0.00268s; std dev. 0.0007729 (taking best). -Reference operation time is 0.000873804 s (0.1648 Mflops) with 12 threads. -After 0.004889s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.003912s; avg 0.001304s ( +/- 40.58/ 25.46 %); best 0.0007749s; worst 0.001636s; std dev. 0.0003782 (taking best). +Reference operation time is 0.00077486 s (0.1858 Mflops) with 12 threads. +After 0.003976s, autotuning routine did not find a better threads count configuration. -Will autotune matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. +Will autotune matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003252s; avg 0.001084s ( +/- 11.91/ 12.44 %); best 0.0009549s; worst 0.001219s; std dev. 0.0001078 (taking best). -Reference operation time is 0.000954866 s (0.1508 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.0009549 Mflops: 0.151) -Merge (22 -> 16 leaves) took w.c.t. of 0.001793s, ~0.002333s of computing time (of which 1.907e-06s sorting, 5.96e-06s analysis) -3 iterations (12 th.) took 0.007648s; avg 0.002549s ( +/- 59.44/118.84 %); best 0.001034s; worst 0.005579s; std dev. 0.002142 (taking best). -Reference operation time is 0.00103402 s (0.1393 Mflops) with 12 threads. -After merge step 1: tpop: 0.001034 s ~Mflops: 0.139 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.083x: 0.0009549s -> 0.001034s. -Merge (16 -> 10 leaves) took w.c.t. of 0.000613s, ~1.502e-05s of computing time (of which 1.907e-06s sorting, 5.007e-06s analysis) -3 iterations (12 th.) took 0.004364s; avg 0.001455s ( +/- 45.63/ 32.07 %); best 0.0007908s; worst 0.001921s; std dev. 0.0004821 (taking best). -Reference operation time is 0.000790834 s (0.1821 Mflops) with 12 threads. -After merge step 2: tpop: 0.0007908 s ~Mflops: 0.182 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.207x: 0.0009549s -> 0.0007908s, so taking this instance. -Merge (10 -> 7 leaves) took w.c.t. of 1.097e-05s, ~3.815e-06s of computing time (of which 9.537e-07s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 0.009063s; avg 0.003021s ( +/- 62.95/109.53 %); best 0.001119s; worst 0.00633s; std dev. 0.002349 (taking best). -Reference operation time is 0.00111914 s (0.1287 Mflops) with 12 threads. -After merge step 3: tpop: 0.001119 s ~Mflops: 0.129 nsubm:7 otn:12 -Applying merge (10 -> 7 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.415x: 0.0007908s -> 0.001119s. +3 iterations (12 th.) took 0.004872s; avg 0.001624s ( +/- 37.31/ 49.93 %); best 0.001018s; worst 0.002435s; std dev. 0.0005963 (taking best). +Reference operation time is 0.00101805 s (0.1414 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz (tpop: 0.001018 Mflops: 0.141) +Merge (22 -> 19 leaves) took w.c.t. of 3.099e-05s, ~1.097e-05s of computing time (of which 9.537e-07s sorting, 6.914e-06s analysis) +3 iterations (12 th.) took 0.006189s; avg 0.002063s ( +/- 33.55/ 62.97 %); best 0.001371s; worst 0.003362s; std dev. 0.0009192 (taking best). +Reference operation time is 0.00137091 s (0.105 Mflops) with 12 threads. +After merge step 1: tpop: 0.001371 s ~Mflops: 0.105 nsubm:19 otn:12 +Applying merge (22 -> 19 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.347x: 0.001018s -> 0.001371s. Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 3 merge steps (of max 6) (22 -> 7 subms) took 0.02718s (of which 0.002434s partitioning, 0s I/O); computing times: 0.002352s in par. loops, 4.768e-06s sorting, 1.383e-05s analyzing) -Total merge + benchmarking process took 0.02718s, equivalent to 34.4/28.5 new/old ops (0.005747s for 2 clones -- as 7.3/6.0 ops, or 3.6/3.0 ops per clone), SPEEDUP of 1.207x -Applying multi-merge (22 -> 10 leaves, 2 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.207x (0.0009549s -> 0.0007908s), will amortize in 165.7 ops by saving 0.000164s per op. -In 1 tuning rounds (tot. 0.033s, 0.0057s for constructor, 2 clones) obtained a SPEEDUP of 20.7% (1.207x) (from 0.1508 to 0.1821 Mflops). -After 0.032810s, global autotuning declared speedup of 1.20742 x, when using threads count of 12 and a new matrix: -(6 x 6)[0xaaab10bc8e70]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 10, symflags:'' +A total of 1 merge steps (of max 6) (22 -> 19 subms) took 0.006242s (of which 3.695e-05s partitioning, 0s I/O); computing times: 1.097e-05s in par. loops, 9.537e-07s sorting, 6.914e-06s analyzing) +Total merge + benchmarking process took 0.006242s, equivalent to 6.1/6.1 new/old ops (0.002831s for 1 clones -- as 2.8/2.8 ops, or 2.8/2.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (12 th.) took 0.003951s; avg 0.001317s ( +/- 26.96/ 26.74 %); best 0.000962s; worst 0.001669s; std dev. 0.0002887 (taking best). +Reference operation time is 0.000962019 s (0.1497 Mflops) with 12 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz (tpop: 0.000962 Mflops: 0.150) +Split (22 -> 25 leaves, 29 -> 33 subms) took 0.0009871s (of which: 3.815e-06s analysis, -1.754e+09s mem.mgmt); compute time: 0.0001221s overall, 4.053e-06s searches, 0.000118s shuffle, 9.298e-05s switch, 1.907e-06s quadrants. +3 iterations (12 th.) took 0.01256s; avg 0.004185s ( +/- 66.12/ 54.18 %); best 0.001418s; worst 0.006453s; std dev. 0.002086 (taking best). +Reference operation time is 0.00141788 s (0.1016 Mflops) with 12 threads. +After split step 1: tpop: 0.001418 s ~Mflops: 0.102 nsubm:25 otn:12 +Applying split (22 -> 25 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.474x: 0.000962s -> 0.001418s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 split steps (of max 6) (22 -> 25 subms) took 0.01373s (of which 0.001059s partitioning, 0s I/O); computing times: 0.0001221s in par. loops, 4.053e-06s sorting, 3.815e-06s analyzing) +Total split + benchmarking process took 0.01373s, equivalent to 14.3/14.3 new/old ops (0.002688s for 1 clones -- as 2.8/2.8 ops, or 2.8/2.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.034s, 0.0055s for constructor, 2 clones) obtained NO speedup (best stays 0.1497 Mflops). +After 0.034411s, global autotuning found old matrix optimal, with declared speedup 1 x when using 12 threads Considering S clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 1.766e-02 s (100.00 %) - analyzed arrays in 7.455e-03 s (42.22 %) + converted COO to RSB in 9.764e-03 s (100.00 %) + analyzed arrays in 2.211e-03 s (22.64 %) cleaned-up arrays in 9.537e-07 s (0.01 %) - deduplicated arrays in 9.537e-07 s (0.01 %) + deduplicated arrays in 0.000e+00 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.771e-03 s (21.35 %) - memory allocations took 4.053e-06 s (0.02 %) - leafs setup took 3.099e-06 s (0.02 %) - halfword conversion took 6.423e-03 s (36.37 %) -Built (6 x 6)[0xaaab10bc8e70]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + shuffled partitions in 2.421e-03 s (24.80 %) + memory allocations took 4.053e-06 s (0.04 %) + leafs setup took 5.007e-06 s (0.05 %) + halfword conversion took 5.121e-03 s (52.45 %) +Built (6 x 6)[0xaaab113f5aa0]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Base matrix: -(6 x 6)[0xaaab10bc8e70]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(6 x 6)[0xaaab113f5aa0]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' -Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. +Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003594s; avg 0.001198s ( +/- 17.79/ 12.78 %); best 0.0009849s; worst 0.001351s; std dev. 0.0001554 (taking best). -Reference operation time is 0.000984907 s (0.1462 Mflops) with 12 threads. -After 0.003617s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.01074s; avg 0.003581s ( +/- 67.52/119.27 %); best 0.001163s; worst 0.007852s; std dev. 0.003029 (taking best). +Reference operation time is 0.00116301 s (0.1238 Mflops) with 12 threads. +After 0.010778s, autotuning routine did not find a better threads count configuration. -Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. +Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003245s; avg 0.001082s ( +/- 33.06/ 31.84 %); best 0.0007241s; worst 0.001426s; std dev. 0.0002867 (taking best). -Reference operation time is 0.000724077 s (0.1989 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.0007241 Mflops: 0.199) -Merge (16 -> 10 leaves) took w.c.t. of 4.482e-05s, ~1.001e-05s of computing time (of which 2.146e-06s sorting, 3.815e-06s analysis) -3 iterations (12 th.) took 0.0217s; avg 0.007234s ( +/- 25.79/ 20.60 %); best 0.005368s; worst 0.008724s; std dev. 0.001396 (taking best). -Reference operation time is 0.00536799 s (0.02683 Mflops) with 12 threads. -After merge step 1: tpop: 0.005368 s ~Mflops: 0.027 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 7.414x: 0.0007241s -> 0.005368s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (16 -> 10 subms) took 0.02178s (of which 4.792e-05s partitioning, 0s I/O); computing times: 1.001e-05s in par. loops, 2.146e-06s sorting, 3.815e-06s analyzing) -Total merge + benchmarking process took 0.02178s, equivalent to 30.1/30.1 new/old ops (0.002602s for 1 clones -- as 3.6/3.6 ops, or 3.6/3.6 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.01474s; avg 0.004914s ( +/- 81.58/ 54.47 %); best 0.000905s; worst 0.007591s; std dev. 0.002888 (taking best). -Reference operation time is 0.000905037 s (0.1591 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.000905 Mflops: 0.159) -Split (16 -> 28 leaves, 21 -> 37 subms) took 0.003631s (of which: 3.815e-06s analysis, -7.155e+09s mem.mgmt); compute time: 0.00459s overall, 4.053e-06s searches, 0.004586s shuffle, 0.004144s switch, 4.625e-05s quadrants. -3 iterations (12 th.) took 0.006021s; avg 0.002007s ( +/- 22.32/ 14.90 %); best 0.001559s; worst 0.002306s; std dev. 0.0003226 (taking best). -Reference operation time is 0.00155902 s (0.09237 Mflops) with 12 threads. -After split step 1: tpop: 0.001559 s ~Mflops: 0.092 nsubm:28 otn:12 -Applying split (16 -> 28 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.723x: 0.000905s -> 0.001559s. -Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 split steps (of max 6) (16 -> 28 subms) took 0.009969s (of which 0.003925s partitioning, 0s I/O); computing times: 0.00459s in par. loops, 4.053e-06s sorting, 3.815e-06s analyzing) -Total split + benchmarking process took 0.009969s, equivalent to 11.0/11.0 new/old ops (0.006512s for 1 clones -- as 7.2/7.2 ops, or 7.2/7.2 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.059s, 0.0091s for constructor, 2 clones) obtained NO speedup (best stays 0.1591 Mflops). -After 0.058969s, global autotuning found old matrix optimal, with declared speedup 1 x when using 12 threads +3 iterations (12 th.) took 0.003956s; avg 0.001319s ( +/- 20.30/ 22.78 %); best 0.001051s; worst 0.001619s; std dev. 0.0002331 (taking best). +Reference operation time is 0.00105095 s (0.137 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz (tpop: 0.001051 Mflops: 0.137) +Merge (16 -> 13 leaves) took w.c.t. of 1.407e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 0.003088s; avg 0.001029s ( +/- 42.00/ 51.67 %); best 0.000597s; worst 0.001561s; std dev. 0.0003999 (taking best). +Reference operation time is 0.000597 s (0.2412 Mflops) with 12 threads. +After merge step 1: tpop: 0.000597 s ~Mflops: 0.241 nsubm:13 otn:12 +Applying merge (16 -> 13 leaves, 12 th.) yielded SPEEDUP of 1.760x: 0.001051s -> 0.000597s, so taking this instance. +Merge (13 -> 10 leaves) took w.c.t. of 2.384e-05s, ~6.914e-06s of computing time (of which 1.907e-06s sorting, 6.914e-06s analysis) +3 iterations (12 th.) took 0.003776s; avg 0.001259s ( +/- 43.19/ 54.85 %); best 0.000715s; worst 0.001949s; std dev. 0.0005144 (taking best). +Reference operation time is 0.000715017 s (0.2014 Mflops) with 12 threads. +After merge step 2: tpop: 0.000715 s ~Mflops: 0.201 nsubm:10 otn:12 +Applying merge (13 -> 10 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.198x: 0.000597s -> 0.000715s. +Merge (10 -> 7 leaves) took w.c.t. of 2.003e-05s, ~6.914e-06s of computing time (of which 9.537e-07s sorting, 5.96e-06s analysis) +3 iterations (12 th.) took 0.004535s; avg 0.001512s ( +/- 28.36/ 21.40 %); best 0.001083s; worst 0.001835s; std dev. 0.000316 (taking best). +Reference operation time is 0.0010829 s (0.133 Mflops) with 12 threads. +After merge step 3: tpop: 0.001083 s ~Mflops: 0.133 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.814x: 0.000597s -> 0.001083s. +Skipping further merge based tests after 2 definite performance degradations in a row (and last exceeding limit). +A total of 3 merge steps (of max 6) (16 -> 7 subms) took 0.02001s (of which 7.033e-05s partitioning, 0s I/O); computing times: 1.788e-05s in par. loops, 3.815e-06s sorting, 1.788e-05s analyzing) +Total merge + benchmarking process took 0.02001s, equivalent to 33.5/19.0 new/old ops (0.01185s for 2 clones -- as 19.8/11.3 ops, or 9.9/5.6 ops per clone), SPEEDUP of 1.760x +Applying multi-merge (16 -> 13 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.760x (0.001051s -> 0.000597s), will amortize in 44.1 ops by saving 0.0004539s per op. +In 1 tuning rounds (tot. 0.027s, 0.012s for constructor, 2 clones) obtained a SPEEDUP of 76.0% (1.76x) (from 0.137 to 0.2412 Mflops). +After 0.027451s, global autotuning declared speedup of 1.76038 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaab113f7e70]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 13, symflags:'' Considering C clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 1.153e-02 s (100.00 %) - analyzed arrays in 4.748e-03 s (41.16 %) - cleaned-up arrays in 0.000e+00 s (0.00 %) + converted COO to RSB in 1.319e-02 s (100.00 %) + analyzed arrays in 2.156e-03 s (16.35 %) + cleaned-up arrays in 1.192e-06 s (0.01 %) deduplicated arrays in 9.537e-07 s (0.01 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.302e-03 s (28.62 %) - memory allocations took 6.199e-06 s (0.05 %) - leafs setup took 2.146e-06 s (0.02 %) - halfword conversion took 3.475e-03 s (30.13 %) -Built (6 x 6)[0xaaab10bcc400]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + shuffled partitions in 8.304e-03 s (62.98 %) + memory allocations took 6.914e-06 s (0.05 %) + leafs setup took 5.007e-06 s (0.04 %) + halfword conversion took 2.710e-03 s (20.55 %) +Built (6 x 6)[0xaaab113fa990]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Base matrix: -(6 x 6)[0xaaab10bcc400]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(6 x 6)[0xaaab113fa990]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.007415s; avg 0.002472s ( +/- 65.73/ 96.43 %); best 0.0008471s; worst 0.004855s; std dev. 0.001722 (taking best). -Reference operation time is 0.000847101 s (0.68 Mflops) with 12 threads. -After 0.007433s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.007631s; avg 0.002544s ( +/- 54.92/101.41 %); best 0.001147s; worst 0.005123s; std dev. 0.001826 (taking best). +Reference operation time is 0.00114679 s (0.5023 Mflops) with 12 threads. +After 0.007672s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003574s; avg 0.001191s ( +/- 13.22/ 25.66 %); best 0.001034s; worst 0.001497s; std dev. 0.0002162 (taking best). -Reference operation time is 0.00103378 s (0.5572 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.001034 Mflops: 0.557) -Merge (22 -> 16 leaves) took w.c.t. of 0.000632s, ~1.001e-05s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 0.005101s; avg 0.0017s ( +/- 47.60/ 62.37 %); best 0.000891s; worst 0.002761s; std dev. 0.0007838 (taking best). -Reference operation time is 0.00089097 s (0.6465 Mflops) with 12 threads. -After merge step 1: tpop: 0.000891 s ~Mflops: 0.646 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.160x: 0.001034s -> 0.000891s, so taking this instance. -Merge (16 -> 10 leaves) took w.c.t. of 0.000212s, ~1.216e-05s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 0.01167s; avg 0.003891s ( +/- 70.06/128.89 %); best 0.001165s; worst 0.008907s; std dev. 0.003551 (taking best). -Reference operation time is 0.00116515 s (0.4944 Mflops) with 12 threads. -After merge step 2: tpop: 0.001165 s ~Mflops: 0.494 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.308x: 0.000891s -> 0.001165s. +3 iterations (12 th.) took 0.003102s; avg 0.001034s ( +/- 17.41/ 17.32 %); best 0.000854s; worst 0.001213s; std dev. 0.0001466 (taking best). +Reference operation time is 0.000854015 s (0.6745 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.000854 Mflops: 0.674) +Merge (22 -> 16 leaves) took w.c.t. of 0.00068s, ~0.0003479s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 0.005046s; avg 0.001682s ( +/- 35.01/ 34.95 %); best 0.001093s; worst 0.00227s; std dev. 0.0004804 (taking best). +Reference operation time is 0.00109315 s (0.5269 Mflops) with 12 threads. +After merge step 1: tpop: 0.001093 s ~Mflops: 0.527 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.280x: 0.000854s -> 0.001093s. Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 merge steps (of max 6) (22 -> 10 subms) took 0.02094s (of which 0.00085s partitioning, 0s I/O); computing times: 2.217e-05s in par. loops, 3.815e-06s sorting, 6.199e-06s analyzing) -Total merge + benchmarking process took 0.02094s, equivalent to 23.5/20.3 new/old ops (0.006367s for 2 clones -- as 7.1/6.2 ops, or 3.6/3.1 ops per clone), SPEEDUP of 1.160x -Applying multi-merge (22 -> 16 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.160x (0.001034s -> 0.000891s), will amortize in 146.6 ops by saving 0.0001428s per op. -In 1 tuning rounds (tot. 0.028s, 0.0064s for constructor, 2 clones) obtained a SPEEDUP of 16.0% (1.16x) (from 0.5572 to 0.6465 Mflops). -After 0.027663s, global autotuning declared speedup of 1.16029 x, when using threads count of 12 and a new matrix: -(6 x 6)[0xaaab10bc8e70]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +A total of 1 merge steps (of max 6) (22 -> 16 subms) took 0.005752s (of which 0.0006859s partitioning, 0s I/O); computing times: 0.0003479s in par. loops, 1.907e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.005752s, equivalent to 6.7/6.7 new/old ops (0.00253s for 1 clones -- as 3.0/3.0 ops, or 3.0/3.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (12 th.) took 0.00385s; avg 0.001283s ( +/- 30.11/ 39.17 %); best 0.0008969s; worst 0.001786s; std dev. 0.0003722 (taking best). +Reference operation time is 0.000896931 s (0.6422 Mflops) with 12 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.0008969 Mflops: 0.642) +Split (22 -> 28 leaves, 29 -> 37 subms) took 0.002001s (of which: 5.96e-06s analysis, -3.509e+09s mem.mgmt); compute time: 0.0004478s overall, 1.907e-06s searches, 0.0004458s shuffle, 0.0004289s switch, 2.146e-06s quadrants. +3 iterations (12 th.) took 0.003902s; avg 0.001301s ( +/- 7.36/ 6.10 %); best 0.001205s; worst 0.00138s; std dev. 7.237e-05 (taking best). +Reference operation time is 0.00120497 s (0.478 Mflops) with 12 threads. +After split step 1: tpop: 0.001205 s ~Mflops: 0.478 nsubm:28 otn:12 +Applying split (22 -> 28 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.343x: 0.0008969s -> 0.001205s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 split steps (of max 6) (22 -> 28 subms) took 0.005948s (of which 0.002032s partitioning, 0s I/O); computing times: 0.0004478s in par. loops, 1.907e-06s sorting, 5.96e-06s analyzing) +Total split + benchmarking process took 0.005948s, equivalent to 6.6/6.6 new/old ops (0.004433s for 1 clones -- as 4.9/4.9 ops, or 4.9/4.9 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.026s, 0.007s for constructor, 2 clones) obtained NO speedup (best stays 0.6422 Mflops). +After 0.025901s, global autotuning found old matrix optimal, with declared speedup 1 x when using 12 threads Considering Z clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 1.254e-02 s (100.00 %) - analyzed arrays in 4.631e-03 s (36.92 %) + converted COO to RSB in 6.916e-03 s (100.00 %) + analyzed arrays in 2.559e-03 s (37.00 %) cleaned-up arrays in 9.537e-07 s (0.01 %) - deduplicated arrays in 1.192e-06 s (0.01 %) + deduplicated arrays in 9.537e-07 s (0.01 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.512e-03 s (28.00 %) - memory allocations took 5.722e-06 s (0.05 %) - leafs setup took 5.960e-06 s (0.05 %) - halfword conversion took 4.387e-03 s (34.97 %) -Built (6 x 6)[0xaaab10bcc400]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' + shuffled partitions in 2.060e-03 s (29.79 %) + memory allocations took 2.861e-06 s (0.04 %) + leafs setup took 7.153e-06 s (0.10 %) + halfword conversion took 2.284e-03 s (33.02 %) +Built (6 x 6)[0xaaab113fa990]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' Base matrix: -(6 x 6)[0xaaab10bcc400]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' +(6 x 6)[0xaaab113fa990]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.005529s; avg 0.001843s ( +/- 53.66/ 83.01 %); best 0.000854s; worst 0.003373s; std dev. 0.001097 (taking best). -Reference operation time is 0.000854015 s (0.6745 Mflops) with 12 threads. -After 0.005555s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.003725s; avg 0.001242s ( +/- 28.40/ 14.52 %); best 0.0008891s; worst 0.001422s; std dev. 0.0002494 (taking best). +Reference operation time is 0.000889063 s (0.6479 Mflops) with 12 threads. +After 0.003752s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.01434s; avg 0.004778s ( +/- 30.50/ 50.34 %); best 0.003321s; worst 0.007184s; std dev. 0.001714 (taking best). -Reference operation time is 0.00332093 s (0.1734 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz (tpop: 0.003321 Mflops: 0.173) -Merge (28 -> 22 leaves) took w.c.t. of 0.001463s, ~1.383e-05s of computing time (of which 1.907e-06s sorting, 5.007e-06s analysis) -3 iterations (12 th.) took 0.007227s; avg 0.002409s ( +/- 14.82/ 10.21 %); best 0.002052s; worst 0.002655s; std dev. 0.0002583 (taking best). -Reference operation time is 0.00205207 s (0.2807 Mflops) with 12 threads. -After merge step 1: tpop: 0.002052 s ~Mflops: 0.281 nsubm:22 otn:12 -Applying merge (28 -> 22 leaves, 12 th.) yielded SPEEDUP of 1.618x: 0.003321s -> 0.002052s, so taking this instance. -Merge (22 -> 16 leaves) took w.c.t. of 0.001172s, ~1.192e-05s of computing time (of which 1.907e-06s sorting, 7.153e-06s analysis) -3 iterations (12 th.) took 0.01708s; avg 0.005694s ( +/- 26.61/ 13.71 %); best 0.004179s; worst 0.006475s; std dev. 0.001072 (taking best). -Reference operation time is 0.004179 s (0.1378 Mflops) with 12 threads. -After merge step 2: tpop: 0.004179 s ~Mflops: 0.138 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 2.036x: 0.002052s -> 0.004179s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 merge steps (of max 6) (28 -> 16 subms) took 0.03422s (of which 0.002648s partitioning, 0s I/O); computing times: 2.575e-05s in par. loops, 3.815e-06s sorting, 1.216e-05s analyzing) -Total merge + benchmarking process took 0.03422s, equivalent to 16.7/10.3 new/old ops (0.01834s for 2 clones -- as 8.9/5.5 ops, or 4.5/2.8 ops per clone), SPEEDUP of 1.618x -Applying multi-merge (28 -> 22 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.618x (0.003321s -> 0.002052s), will amortize in 27.0 ops by saving 0.001269s per op. -In 1 tuning rounds (tot. 0.06s, 0.018s for constructor, 2 clones) obtained a SPEEDUP of 61.8% (1.618x) (from 0.1734 to 0.2807 Mflops). -After 0.059876s, global autotuning declared speedup of 1.61833 x, when using threads count of 12 and a new matrix: -(6 x 6)[0xaaab10bcfb50]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +3 iterations (12 th.) took 0.005426s; avg 0.001809s ( +/- 7.78/ 4.27 %); best 0.001668s; worst 0.001886s; std dev. 9.963e-05 (taking best). +Reference operation time is 0.00166798 s (0.3453 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz (tpop: 0.001668 Mflops: 0.345) +Merge (28 -> 22 leaves) took w.c.t. of 0.0003231s, ~1.311e-05s of computing time (of which 2.146e-06s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 0.005192s; avg 0.001731s ( +/- 26.96/ 52.38 %); best 0.001264s; worst 0.002637s; std dev. 0.0006411 (taking best). +Reference operation time is 0.0012641 s (0.4557 Mflops) with 12 threads. +After merge step 1: tpop: 0.001264 s ~Mflops: 0.456 nsubm:22 otn:12 +Applying merge (28 -> 22 leaves, 12 th.) yielded SPEEDUP of 1.320x: 0.001668s -> 0.001264s, so taking this instance. +Merge (22 -> 16 leaves) took w.c.t. of 0.002038s, ~1.526e-05s of computing time (of which 1.907e-06s sorting, 5.96e-06s analysis) +3 iterations (12 th.) took 0.00497s; avg 0.001657s ( +/- 14.47/ 16.63 %); best 0.001417s; worst 0.001932s; std dev. 0.0002118 (taking best). +Reference operation time is 0.00141692 s (0.4065 Mflops) with 12 threads. +After merge step 2: tpop: 0.001417 s ~Mflops: 0.407 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.121x: 0.001264s -> 0.001417s. +Merge (16 -> 10 leaves) took w.c.t. of 0.0005069s, ~2.289e-05s of computing time (of which 2.861e-06s sorting, 5.96e-06s analysis) +3 iterations (12 th.) took 0.004326s; avg 0.001442s ( +/- 31.57/ 23.17 %); best 0.0009868s; worst 0.001776s; std dev. 0.0003334 (taking best). +Reference operation time is 0.000986814 s (0.5837 Mflops) with 12 threads. +After merge step 3: tpop: 0.0009868 s ~Mflops: 0.584 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.281x: 0.001264s -> 0.0009868s, so taking this instance. +Merge (10 -> 7 leaves) took w.c.t. of 1.502e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) +3 iterations (12 th.) took 0.003313s; avg 0.001104s ( +/- 16.43/ 30.40 %); best 0.0009229s; worst 0.00144s; std dev. 0.0002376 (taking best). +Reference operation time is 0.000922918 s (0.6241 Mflops) with 12 threads. +After merge step 4: tpop: 0.0009229 s ~Mflops: 0.624 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded SPEEDUP of 1.069x: 0.0009868s -> 0.0009229s, so taking this instance. +Merge (7 -> 4 leaves) took w.c.t. of 1.502e-05s, ~4.053e-06s of computing time (of which 1.192e-06s sorting, 3.815e-06s analysis) +3 iterations (12 th.) took 0.002645s; avg 0.0008817s ( +/- 29.91/ 40.86 %); best 0.000618s; worst 0.001242s; std dev. 0.0002637 (taking best). +Reference operation time is 0.000617981 s (0.9321 Mflops) with 12 threads. +After merge step 5: tpop: 0.000618 s ~Mflops: 0.932 nsubm:4 otn:12 +Applying merge (7 -> 4 leaves, 12 th.) yielded SPEEDUP of 1.493x: 0.0009229s -> 0.000618s, so taking this instance. +Merge (4 -> 1 leaves) took w.c.t. of 1.121e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 94.20/129.41 %); best 7.834e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). +Reference operation time is 7.83443e-08 s (7352 Mflops) with 12 threads. +After merge step 6: tpop: 7.834e-08 s ~Mflops: 7352.158 nsubm:1 otn:12 +Applying merge (4 -> 1 leaves, 12 th.) yielded SPEEDUP of 7888.010x: 0.000618s -> 7.834e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 6 merge steps (of max 6) (28 -> 1 subms) took 0.04207s (of which 0.002937s partitioning, 0s I/O); computing times: 6.437e-05s in par. loops, 1.001e-05s sorting, 2.575e-05s analyzing) +Total merge + benchmarking process took 0.04207s, equivalent to 537051.1/25.2 new/old ops (0.02272s for 6 clones -- as 289948.3/13.6 ops, or 48324.7/2.3 ops per clone), SPEEDUP of 21290.323x +Applying multi-merge (28 -> 1 leaves, 6 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 21290.323x (0.001668s -> 7.834e-08s), will amortize in 25.2 ops by saving 0.001668s per op. +In 1 tuning rounds (tot. 0.052s, 0.023s for constructor, 6 clones) obtained a SPEEDUP of 2128932.3% (2.129e+04x) (from 0.3453 to 7352 Mflops). +After 0.051777s, global autotuning declared speedup of 21290.3 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaab113f7e70]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -9237,10 +9279,10 @@ 4 0 DIFF PRINT TEST END Beginning large binary search test. -Detected 33603371008 bytes of memory, comprehensive of 8611643392 of free memory. +Detected 33603371008 bytes of memory, comprehensive of 5862813696 of free memory. On this system, maximal array of coordinates can have 2147483137 elements and occupy 8589932548 bytes. -Will perform the test using less memory (6159 MB) than on the maximal coordinate indices array (6458732544) allows. -(c)allocated 1614683136 nnz (6458732544 bytes) +Will perform the test using less memory (4193 MB) than on the maximal coordinate indices array (4397110272) allows. +(c)allocated 1099277568 nnz (4397110272 bytes) Succeeded retrieving array last element. Successfully performed large binary search test. BASIC SPARSE BLAS TEST: BEGIN @@ -9249,7 +9291,7 @@ got RSB_IO_WANT_IS_INITIALIZED_MARKER: 1 INIT INTERFACE TEST: END (SUCCESS) DEVEL PRINT TEST: BEGIN -(4 x 4)[0xaaab13be63a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(4 x 4)[0xaaab047513a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -9258,8 +9300,8 @@ RSB_FLAG_ASSEMBLED_IN_COO_ARRAYS | RSB_FLAG_OWN_PARTITIONING_ARRAYS | RSB_FLAG_SORT_INPUT -(2 x 2)[0xaaab13be64b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0xaaab13be65c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaab047514b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaab047515c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' #R 4 x 4, 4 nnz (16 bytes), 16 index space for bytes, 544 bytes for 2 structs (2 of which are on the diagonal) (1e+02% of nnz are on the diagonal) #N at 0 0, 4 x 4, 4 nnz ( 25%) #T at 0 0, 2 x 2, 2 nnz ( 50%) @@ -9267,9 +9309,9 @@ ( 0x2046186 = { rec:1 coo:1 css:1 hw:1 ic:1 fi:0 symflags: } ) DEVEL PRINT TEST: END PRINT TEST: BEGIN [QUIET] -(2 x 2)[0xaaab13be64b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0xaaab13be65c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(4 x 4)[0xaaab13be63a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(2 x 2)[0xaaab047514b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaab047515c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(4 x 4)[0xaaab047513a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -9287,8 +9329,8 @@ BASIC PRIMITIVES TEST: BEGIN BASIC PRIMITIVES TEST: END (SUCCESS) ADVANCED SPARSE BLAS TEST: BEGIN [limit 30.000000s] [QUIET] -Terminating testing earlier due to user timeout request: test took 30.000274 s, max allowed was 30.000000. - PASSED:18047 +Terminating testing earlier due to user timeout request: test took 30.002071 s, max allowed was 30.000000. + PASSED:19372 FAILED:0 ADVANCED SPARSE BLAS TEST: END (SUCCESS) gmake qtests -C librsbpp @@ -9297,17 +9339,17 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' ./rsbtt -if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh +if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh ++ grep Z-sort -++ ./rsbpp Td,s G.mtx ++ wc -l +++ ./rsbpp Td,s G.mtx + test 54 = 54 ++ ./rsbpp Td G.mtx ++ grep Z-sort ++ wc -l + test 27 = 27 -++ grep Z-sort ++ ./rsbpp Td,z G.mtx +++ grep Z-sort ++ wc -l + test 54 = 54 ++ ./rsbpp vTd,z G.mtx @@ -9319,8 +9361,8 @@ ++ wc -l + test 54 = 54 ++ ./rsbpp vvvTd,z G.mtx -++ grep Zorted ++ wc -l +++ grep Zorted + test 8 = 8 ++ ./rsbpp vvTd,z G.mtx ++ grep Z-sort @@ -9344,13 +9386,13 @@ + test 258 = 258 ++ OMP_NUM_THREADS=1 ++ ./rsbpp m10M10I1r1,4,8sFv -++ wc -l ++ grep spmm- +++ wc -l + test 9 = 9 ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r1,4,8sFv -++ grep spmm- ++ wc -l +++ grep spmm- + test 9 = 9 ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r1sFvtN,T @@ -9364,8 +9406,8 @@ + test 2 = 2 ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r0vtN,TsF -++ grep spmm- ++ wc -l +++ grep spmm- + test 0 = 0 ++ OMP_NUM_THREADS=1 ++ RSB_NUM_THREADS=1 @@ -9382,8 +9424,8 @@ ++ OMP_NUM_THREADS=1 ++ RSB_NUM_THREADS=1 ++ ./rsbpp vvvC1000m100M100I1r1vtN,ToRsF -++ wc -l ++ grep Recursing +++ wc -l + test 208 = 208 ++ OMP_NUM_THREADS=2 ++ RSB_NUM_THREADS=2 @@ -9436,7 +9478,7 @@ 0 0 0 0 before tuning for SPMV: -(3 x 3)[0xaaaac0bc74c0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' +(3 x 3)[0xaaaae9cc40a0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' ** x: 1.1 @@ -9525,18 +9567,18 @@ BEGIN Rsb_Matrix_test_multimatrix_ms_mnrhs BEGIN -(3 x 3)[0xaaaac0bfb700]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1: -(3 x 3)[0xaaaac0bfb700]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaaac0bfa980]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1: -(3 x 3)[0xaaaac0bfa980]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaaac0bfadd0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae9cec170]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaaac0bfadd0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaaac0bfa980]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae9cec170]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae9cf2200]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaaac0bfa980]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae9cf2200]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae9cec170]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1.00954: +(3 x 3)[0xaaaae9cfd1c0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae9cec170]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1.01041: +(3 x 3)[0xaaaae9cfbea0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' END OK: terminating with no allocations registered in librsb [*] tests terminated successfully ! @@ -9553,10 +9595,10 @@ ./rsbtest --no-tune --max_t 0.01 --serial | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q Building ./rsbtest --no-tune --max_t 0.01 --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --no-trans --alpha 1 --type d --rand --serial . | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q adding ! ./rsbtest --mkl A.mkl -running on codethink03-arm64 +running on i-capture-the-hostname Built without the MKL. ( ! ./rsbtest --unrecognized-option-triggers-abort ) -running on codethink03-arm64 +running on i-capture-the-hostname /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest/.libs/rsbtest: unrecognized option '--unrecognized-option-triggers-abort' unrecognized option, aborting. ( ./rsbtest --no-tune --max_t 0.01 --skip-loading-hermitian-matrices --skip-loading-unsymmetric-matrices --tune-maxt 10 --tune-maxr 10 --verbose-tuning --extra-verbose-interface --min_t 0.01 --max_t 0.01 --mintimes 1 --maxtimes 1 --verbose --skip-loading-symmetric-matrices A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q skip ) @@ -9565,7 +9607,7 @@ ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --types all --nthreads 1,2 --maxtimes 1 -+ A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q 2.threads ) ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --render-only A.mtx > /dev/null ) ! ./rsbtest --no-tune --max_t 0.01 --quiet --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --render --no-trans --alpha 1 --type all A.mtx -running on codethink03-arm64 +running on i-capture-the-hostname Will not invoke autotuning routine. Benchmark will sample for at most 0.01 s Built without render support! @@ -9617,7 +9659,7 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' - /bin/bash ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' + /bin/sh ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' libtool: install: /usr/bin/install -c .libs/librsb.so.0.0.0 /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu/librsb.so.0.0.0 libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu && { ln -s -f librsb.so.0.0.0 librsb.so.0 || { rm -f librsb.so.0 && ln -s librsb.so.0.0.0 librsb.so.0; }; }) libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu && { ln -s -f librsb.so.0.0.0 librsb.so || { rm -f librsb.so && ln -s librsb.so.0.0.0 librsb.so; }; }) @@ -9627,7 +9669,7 @@ libtool: install: ranlib /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu/librsb.a libtool: warning: remember to run 'libtool --finish /usr/lib/aarch64-linux-gnu' /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' - /bin/bash ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' + /bin/sh ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' libtool: warning: 'librsb.la' has not been installed in '/usr/lib/aarch64-linux-gnu' libtool: install: /usr/bin/install -c .libs/rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin/rsbench /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' @@ -9764,10 +9806,10 @@ dh_builddeb dpkg-deb: building package 'librsb0t64' in '../librsb0t64_1.3.0.2+dfsg-7_arm64.deb'. dpkg-deb: building package 'librsb0t64-dbgsym' in '../librsb0t64-dbgsym_1.3.0.2+dfsg-7_arm64.deb'. -dpkg-deb: building package 'librsb-dev' in '../librsb-dev_1.3.0.2+dfsg-7_arm64.deb'. -dpkg-deb: building package 'librsb-tools' in '../librsb-tools_1.3.0.2+dfsg-7_arm64.deb'. dpkg-deb: building package 'librsb-tools-dbgsym' in '../librsb-tools-dbgsym_1.3.0.2+dfsg-7_arm64.deb'. +dpkg-deb: building package 'librsb-dev' in '../librsb-dev_1.3.0.2+dfsg-7_arm64.deb'. dpkg-deb: building package 'librsb-doc' in '../librsb-doc_1.3.0.2+dfsg-7_all.deb'. +dpkg-deb: building package 'librsb-tools' in '../librsb-tools_1.3.0.2+dfsg-7_arm64.deb'. dpkg-genbuildinfo --build=binary -O../librsb_1.3.0.2+dfsg-7_arm64.buildinfo dpkg-genchanges --build=binary -O../librsb_1.3.0.2+dfsg-7_arm64.changes dpkg-genchanges: info: binary-only upload (no source code included) @@ -9776,12 +9818,14 @@ dpkg-buildpackage: info: binary-only upload (no source included) dpkg-genchanges: info: not including original source code in upload I: copying local configuration +I: user script /srv/workspace/pbuilder/1730324/tmp/hooks/B01_cleanup starting +I: user script /srv/workspace/pbuilder/1730324/tmp/hooks/B01_cleanup finished I: unmounting dev/ptmx filesystem I: unmounting dev/pts filesystem I: unmounting dev/shm filesystem I: unmounting proc filesystem I: unmounting sys filesystem I: cleaning the build env -I: removing directory /srv/workspace/pbuilder/1467199 and its subdirectories -I: Current time: Sat Sep 5 19:50:38 -12 2026 -I: pbuilder-time-stamp: 1788681038 +I: removing directory /srv/workspace/pbuilder/1730324 and its subdirectories +I: Current time: Mon Aug 4 15:39:59 +14 2025 +I: pbuilder-time-stamp: 1754271599