Diff of the two buildlogs: -- --- b1/build.log 2025-02-07 08:42:32.553800180 +0000 +++ b2/build.log 2025-02-07 08:56:32.195912919 +0000 @@ -1,6 +1,6 @@ I: pbuilder: network access will be disabled during build -I: Current time: Thu Mar 12 02:53:14 -12 2026 -I: pbuilder-time-stamp: 1773327194 +I: Current time: Fri Feb 7 22:42:35 +14 2025 +I: pbuilder-time-stamp: 1738917755 I: Building the build Environment I: extracting base tarball [/var/cache/pbuilder/trixie-reproducible-base.tgz] I: copying local configuration @@ -25,52 +25,84 @@ dpkg-source: info: applying auto-gitignore I: Not using root during the build. I: Installing the build-deps -I: user script /srv/workspace/pbuilder/2200206/tmp/hooks/D02_print_environment starting +I: user script /srv/workspace/pbuilder/1182468/tmp/hooks/D01_modify_environment starting +debug: Running on codethink04-arm64. +I: Changing host+domainname to test build reproducibility +I: Adding a custom variable just for the fun of it... +I: Changing /bin/sh to bash +'/bin/sh' -> '/bin/bash' +lrwxrwxrwx 1 root root 9 Feb 7 08:42 /bin/sh -> /bin/bash +I: Setting pbuilder2's login shell to /bin/bash +I: Setting pbuilder2's GECOS to second user,second room,second work-phone,second home-phone,second other +I: user script /srv/workspace/pbuilder/1182468/tmp/hooks/D01_modify_environment finished +I: user script /srv/workspace/pbuilder/1182468/tmp/hooks/D02_print_environment starting I: set - BUILDDIR='/build/reproducible-path' - BUILDUSERGECOS='first user,first room,first work-phone,first home-phone,first other' - BUILDUSERNAME='pbuilder1' - BUILD_ARCH='arm64' - DEBIAN_FRONTEND='noninteractive' + BASH=/bin/sh + BASHOPTS=checkwinsize:cmdhist:complete_fullquote:extquote:force_fignore:globasciiranges:globskipdots:hostcomplete:interactive_comments:patsub_replacement:progcomp:promptvars:sourcepath + BASH_ALIASES=() + BASH_ARGC=() + BASH_ARGV=() + BASH_CMDS=() + BASH_LINENO=([0]="12" [1]="0") + BASH_LOADABLES_PATH=/usr/local/lib/bash:/usr/lib/bash:/opt/local/lib/bash:/usr/pkg/lib/bash:/opt/pkg/lib/bash:. + BASH_SOURCE=([0]="/tmp/hooks/D02_print_environment" [1]="/tmp/hooks/D02_print_environment") + BASH_VERSINFO=([0]="5" [1]="2" [2]="37" [3]="1" [4]="release" [5]="aarch64-unknown-linux-gnu") + BASH_VERSION='5.2.37(1)-release' + BUILDDIR=/build/reproducible-path + BUILDUSERGECOS='second user,second room,second work-phone,second home-phone,second other' + BUILDUSERNAME=pbuilder2 + BUILD_ARCH=arm64 + DEBIAN_FRONTEND=noninteractive DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=12 ' - DISTRIBUTION='trixie' - HOME='/root' - HOST_ARCH='arm64' + DIRSTACK=() + DISTRIBUTION=trixie + EUID=0 + FUNCNAME=([0]="Echo" [1]="main") + GROUPS=() + HOME=/root + HOSTNAME=i-capture-the-hostname + HOSTTYPE=aarch64 + HOST_ARCH=arm64 IFS=' ' - INVOCATION_ID='824cac00744f4de38632fb79c0529666' - LANG='C' - LANGUAGE='en_US:en' - LC_ALL='C' - MAIL='/var/mail/root' - OPTIND='1' - PATH='/usr/sbin:/usr/bin:/sbin:/bin:/usr/games' - PBCURRENTCOMMANDLINEOPERATION='build' - PBUILDER_OPERATION='build' - PBUILDER_PKGDATADIR='/usr/share/pbuilder' - PBUILDER_PKGLIBDIR='/usr/lib/pbuilder' - PBUILDER_SYSCONFDIR='/etc' - PPID='2200206' - PS1='# ' - PS2='> ' + INVOCATION_ID=744c09a0bd02417ea3d187949cac53e1 + LANG=C + LANGUAGE=nl_BE:nl + LC_ALL=C + MACHTYPE=aarch64-unknown-linux-gnu + MAIL=/var/mail/root + OPTERR=1 + OPTIND=1 + OSTYPE=linux-gnu + PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path + PBCURRENTCOMMANDLINEOPERATION=build + PBUILDER_OPERATION=build + PBUILDER_PKGDATADIR=/usr/share/pbuilder + PBUILDER_PKGLIBDIR=/usr/lib/pbuilder + PBUILDER_SYSCONFDIR=/etc + PIPESTATUS=([0]="0") + POSIXLY_CORRECT=y + PPID=1182468 PS4='+ ' - PWD='/' - SHELL='/bin/bash' - SHLVL='2' - SUDO_COMMAND='/usr/bin/timeout -k 18.1h 18h /usr/bin/ionice -c 3 /usr/bin/nice /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.YHA4EUgZ/pbuilderrc_3EBu --distribution trixie --hookdir /etc/pbuilder/first-build-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/trixie-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.YHA4EUgZ/b1 --logfile b1/build.log librsb_1.3.0.2+dfsg-7.dsc' - SUDO_GID='109' - SUDO_UID='104' - SUDO_USER='jenkins' - TERM='unknown' - TZ='/usr/share/zoneinfo/Etc/GMT+12' - USER='root' - _='/usr/bin/systemd-run' - http_proxy='http://192.168.101.4:3128' + PWD=/ + SHELL=/bin/bash + SHELLOPTS=braceexpand:errexit:hashall:interactive-comments:posix + SHLVL=3 + SUDO_COMMAND='/usr/bin/timeout -k 24.1h 24h /usr/bin/ionice -c 3 /usr/bin/nice -n 11 /usr/bin/unshare --uts -- /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.YHA4EUgZ/pbuilderrc_NZos --distribution trixie --hookdir /etc/pbuilder/rebuild-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/trixie-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.YHA4EUgZ/b2 --logfile b2/build.log librsb_1.3.0.2+dfsg-7.dsc' + SUDO_GID=109 + SUDO_UID=104 + SUDO_USER=jenkins + TERM=unknown + TZ=/usr/share/zoneinfo/Etc/GMT-14 + UID=0 + USER=root + _='I: set' + http_proxy=http://192.168.101.4:3128 I: uname -a - Linux codethink03-arm64 6.1.0-30-cloud-arm64 #1 SMP Debian 6.1.124-1 (2025-01-12) aarch64 GNU/Linux + Linux i-capture-the-hostname 6.1.0-30-cloud-arm64 #1 SMP Debian 6.1.124-1 (2025-01-12) aarch64 GNU/Linux I: ls -l /bin - lrwxrwxrwx 1 root root 7 Nov 22 2024 /bin -> usr/bin -I: user script /srv/workspace/pbuilder/2200206/tmp/hooks/D02_print_environment finished + lrwxrwxrwx 1 root root 7 Nov 22 14:40 /bin -> usr/bin +I: user script /srv/workspace/pbuilder/1182468/tmp/hooks/D02_print_environment finished -> Attempting to satisfy build-dependencies -> Creating pbuilder-satisfydepends-dummy package Package: pbuilder-satisfydepends-dummy @@ -296,7 +328,7 @@ Get: 178 http://deb.debian.org/debian trixie/main arm64 libltdl-dev arm64 2.5.4-3 [168 kB] Get: 179 http://deb.debian.org/debian trixie/main arm64 libhwloc-dev arm64 2.11.2-1 [237 kB] Get: 180 http://deb.debian.org/debian trixie/main arm64 zlib1g-dev arm64 1:1.3.dfsg+really1.3.1-1+b1 [917 kB] -Fetched 366 MB in 1s (309 MB/s) +Fetched 366 MB in 2s (168 MB/s) Preconfiguring packages ... Selecting previously unselected package liblocale-gettext-perl. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 19956 files and directories currently installed.) @@ -894,8 +926,8 @@ Setting up tzdata (2024b-6) ... Current default time zone: 'Etc/UTC' -Local time is now: Thu Mar 12 14:53:54 UTC 2026. -Universal Time is now: Thu Mar 12 14:53:54 UTC 2026. +Local time is now: Fri Feb 7 08:44:04 UTC 2025. +Universal Time is now: Fri Feb 7 08:44:04 UTC 2025. Run 'dpkg-reconfigure tzdata' if you wish to change it. Setting up libfontenc1:arm64 (1:1.1.8-1+b2) ... @@ -1062,7 +1094,11 @@ Building tag database... -> Finished parsing the build-deps I: Building the package -I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-7_source.changes +I: user script /srv/workspace/pbuilder/1182468/tmp/hooks/A99_set_merged_usr starting +Not re-configuring usrmerge for trixie +I: user script /srv/workspace/pbuilder/1182468/tmp/hooks/A99_set_merged_usr finished +hostname: Name or service not known +I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-7_source.changes dpkg-buildpackage: info: source package librsb dpkg-buildpackage: info: source version 1.3.0.2+dfsg-7 dpkg-buildpackage: info: source distribution unstable @@ -1082,62 +1118,62 @@ dh binary dh_update_autotools_config dh_autoreconf -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found libtoolize: putting auxiliary files in '.'. libtoolize: copying file './ltmain.sh' libtoolize: putting macros in AC_CONFIG_MACRO_DIRS, 'm4'. @@ -1179,90 +1215,90 @@ libtoolize: copying file 'm4/ltsugar.m4' libtoolize: copying file 'm4/ltversion.m4' libtoolize: copying file 'm4/lt~obsolete.m4' -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found configure.ac:66: installing './compile' configure.ac:65: installing './missing' Makefile.am: installing './depcomp' @@ -1448,7 +1484,7 @@ checking for m4... m4 checking for gmake... gmake checking for ggrep... /usr/bin/grep -checking for bash... /bin/bash +checking for bash... /bin/sh checking for gsed... /usr/bin/sed checking for cmp... cmp checking for basename... basename @@ -1565,7 +1601,7 @@ configure: It appears that Fortran programs can be linked without using the Fortran linker. configure: Using OPENMP_CFLAGS ok for linking an OpenMP program: adding it to LIBS. checking if your have a usable getrusage() ... 1 -checking for /bin/bash... /bin/bash +checking for /bin/sh... /bin/sh configure: Will not use Google Test. configure: You seem to not have GNU Octave or have disabled 'int' type. Part of the test suite will not be generated. If you want more testing capabilities, you should enable the 'int' type as well. checking that generated files are newer than configure... done @@ -1587,7 +1623,7 @@ config.status: executing depfiles commands config.status: executing libtool commands === configuring in librsbpp (/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1712,7 +1748,7 @@ configure: Will not use Google Test. checking whether you have std::thread... yes checking whether you have std::mutex... yes -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1721,7 +1757,7 @@ config.status: executing libtool commands configure: Successfully created a Makefile. === configuring in rsblib (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1833,7 +1869,7 @@ checking for filesystem... yes checking for main in -lstdc++fs... yes configure: Assuming you are yet to build librsb.la. (set LIBS= -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la) -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1843,7 +1879,7 @@ config.status: executing libtool commands configure: Created a Makefile. === configuring in rsbtest (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=aarch64-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/aarch64-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-memhinfo=L2:4/64/512K,L1:8/64/24K' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=aarch64-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether sleep supports fractional seconds... yes checking filesystem timestamp resolution... 0.01 @@ -1957,7 +1993,7 @@ checking for filesystem... yes checking for rsb_lib_init... no checking for dd... yes -/bin/bash +/bin/sh /usr/bin/timeout checking that generated files are newer than configure... done configure: creating ./config.status @@ -1989,7 +2025,7 @@ ARFLAGS : cru M4 : m4 MAKE : gmake - BASH : /bin/bash + BASH : /bin/sh OCTAVE : false DOXYGEN : doxygen HELP2MAN : help2man @@ -2045,24 +2081,24 @@ Making all in librsbpp gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp.o rsbpp.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c -o rsbtt.o rsbtt.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -c -o rsbct.o rsbct.c -libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -fPIC -DPIC -o .libs/rsbpp_coo.o libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -fPIC -DPIC -o .libs/rsbpp_csr.o +libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -fPIC -DPIC -o .libs/rsbpp_coo.o libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -o rsbpp_coo.o >/dev/null 2>&1 libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -o rsbpp_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs libtool: link: ar cr .libs/librsbpp.a .libs/rsbpp_coo.o .libs/rsbpp_csr.o libtool: link: ranlib .libs/librsbpp.a libtool: link: ( cd ".libs" && rm -f "librsbpp.la" && ln -s "../librsbpp.la" "librsbpp.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs -libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbtt rsbtt.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp -libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbpp rsbpp.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbct rsbct.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp +libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbpp rsbpp.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp +libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbtt rsbtt.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp gmake all-am gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' @@ -2080,89 +2116,87 @@ gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsbench-rsb_libspblas_tests.o `test -f 'rsb_libspblas_tests.c' || echo './'`rsb_libspblas_tests.c g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -c -o rsb_dummy.o rsb_dummy.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o ch2icfb-ch2icfb.o `test -f 'ch2icfb.c' || echo './'`ch2icfb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_stropts.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_stropts.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_vb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_vb.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_lb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_lb.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -o librsb_nounroll_la-rsb_unroll.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_vb.c -o librsb_nounroll_la-rsb_krnl_vb.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_stropts.c -o librsb_nounroll_la-rsb_stropts.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_lb.c -o librsb_nounroll_la-rsb_krnl_lb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_unroll.c -o librsb_nounroll_la-rsb_unroll.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_strmif.c -o librsb_nounroll_la-rsb_strmif.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mergesort.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_mergesort.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_permute.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_permute.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_l.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_permute.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_permute.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_l.c -o librsb_nounroll_la-rsb_krnl_bcss_l.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mergesort.c -o librsb_nounroll_la-rsb_mergesort.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_u.c -o librsb_nounroll_la-rsb_krnl_bcss_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spmv.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spmv.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss.c -o librsb_nounroll_la-rsb_krnl_bcss.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bench.c -o librsb_nounroll_la-rsb_bench.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_permute.c -o librsb_nounroll_la-rsb_permute.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_merge.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_merge.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spmv.c -o librsb_nounroll_la-rsb_spmv.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_merge.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_merge.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_ompio.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_ompio.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_util.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_ompio.c -o librsb_nounroll_la-rsb_ompio.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_merge.c -o librsb_nounroll_la-rsb_merge.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_util.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm_csr.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spgemm_csr.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spsum_misc.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm_csr.c -o librsb_nounroll_la-rsb_spgemm_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_prec.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_prec.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -o librsb_nounroll_la-rsb_spsum_misc.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm_csr.c -o librsb_nounroll_la-rsb_spgemm_csr.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_prec.c -o librsb_nounroll_la-rsb_prec.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum_misc.c -o librsb_nounroll_la-rsb_spsum_misc.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_is.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_is.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mio.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_is.c -o librsb_base_la-rsb_is.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_op.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_op.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_bio.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_op.c -o librsb_base_la-rsb_op.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_get.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_bio.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_is.c -o librsb_base_la-rsb_is.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_bio.c -o librsb_base_la-rsb_bio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_get.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_set.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_set.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_set.c -o librsb_base_la-rsb_set.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mio.c -o librsb_base_la-rsb_mio.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo.o rsb_test_matops.c: In function 'rsb__main_block_partitioned_spmv_sxsa': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2181,137 +2215,125 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_set.c -o librsb_base_la-rsb_set.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo.c -o librsb_base_la-rsb_coo.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_get.c -o librsb_base_la-rsb_get.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_check.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_check.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_symm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_symm.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_check.c -o librsb_base_la-rsb_coo_check.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_idx.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo_symm.c -o librsb_base_la-rsb_coo_symm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_idx.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srt.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srtp.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_idx.c -o librsb_base_la-rsb_idx.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_src.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_src.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -o librsb_base_la-rsb_srt.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srtp.c -o librsb_base_la-rsb_srtp.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_srt.c -o librsb_base_la-rsb_srt.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_src.c -o librsb_base_la-rsb_src.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_test_accuracy.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_clone.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_render.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_render.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_clone.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_test_accuracy.c -o librsb_base_la-rsb_test_accuracy.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_render.c -o librsb_base_la-rsb_render.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -o librsb_base_la-rsb_clone.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_eps.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_eps.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -o librsb_base_la-rsb_rec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_msort_up.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_msort_up.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_clone.c -o librsb_base_la-rsb_clone.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_msort_up.c -o librsb_base_la-rsb_msort_up.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_sys.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_blas_stuff.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec.c -o librsb_base_la-rsb_rec.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_eps.c -o librsb_base_la-rsb_eps.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_sys.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_gen.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_gen.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_blas_stuff.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -o librsb_base_la-rsb_sys.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_blas_stuff.c -o librsb_base_la-rsb_blas_stuff.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_gen.c -o librsb_base_la-rsb_gen.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_perf.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_sys.c -o librsb_base_la-rsb_sys.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -o librsb_base_la-rsb_perf.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rsb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rsb.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_gen.c -o librsb_base_la-rsb_gen.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_err.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_err.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_tune.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_do.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_err.c -o librsb_base_la-rsb_err.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rsb.c -o librsb_base_la-rsb_rsb.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_do.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_tune.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_perf.c -o librsb_base_la-rsb_perf.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -o librsb_base_la-rsb_do.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_internals.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_internals.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_garbage.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_garbage.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_partition.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mmio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mmio.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_do.c -o librsb_base_la-rsb_do.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -o librsb_base_la-rsb_partition.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_partition.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_garbage.c -o librsb_base_la-rsb_garbage.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mmio.c -o librsb_base_la-rsb_mmio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_fpb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_fpb.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_partition.c -o librsb_base_la-rsb_partition.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mbw.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_internals.c -o librsb_base_la-rsb_internals.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_limiter.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_fpb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_fpb.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spgemm.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -o librsb_base_la-rsb_limiter.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_limiter.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_internals.c -o librsb_base_la-rsb_internals.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_fpb.c -o librsb_base_la-rsb_fpb.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_limiter.c -o librsb_base_la-rsb_limiter.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spgemm.c -o librsb_base_la-rsb_spgemm.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsum.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsv.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsum.c -o librsb_base_la-rsb_spsum.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_init.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_swt.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_lock.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsv.c -o librsb_base_la-rsb_spsv.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_lock.c -o librsb_base_la-rsb_lock.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_spsv.c -o librsb_base_la-rsb_spsv.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_swt.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_init.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_dump.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -o librsb_base_la-rsb_init.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -o librsb_base_la-rsb_swt.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_cpmv.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -o librsb_base_la-rsb_cpmv.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_swt.c -o librsb_base_la-rsb_swt.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_init.c -o librsb_base_la-rsb_init.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_asm.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo2rec.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_user.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2coo.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2csr.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -o librsb_base_la-rsb_user.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -o librsb_base_la-rsb_rec2csr.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -o librsb_base_la-rsb_rec2coo.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -o librsb_base_la-rsb_csr2coo.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_cpmv.c -o librsb_base_la-rsb_cpmv.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c rsb_test_matops.c: In function 'rsb__main_block_partitioned_spsv_sxsx': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2326,32 +2348,46 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo2rec.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_user.c -o librsb_base_la-rsb_user.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2coo.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2csr.o +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2coo.c -o librsb_base_la-rsb_rec2coo.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_rec2csr.c -o librsb_base_la-rsb_rec2csr.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_csr2coo.c -o librsb_base_la-rsb_csr2coo.o >/dev/null 2>&1 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -fPIC -o .libs/rsb_blas_sparse.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb_blas_sparse.o rsb_blas_sparse.F90 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -fPIC -DPIC -o .libs/rsb_libspblas_handle.o +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl.c -o librsb_nounroll_la-rsb_krnl.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -fPIC -DPIC -o .libs/rsb_libspblas.o libtool: warning: '-version-info' is ignored for programs libtool: link: gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -Wl,-z -Wl,relro -o ch2icfb ch2icfb-ch2icfb.o -fopenmp -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp if test -f ./rsb_types.h -a ! -f ./rsb_types.h ; then cp -pv ./rsb_types.h ./rsb_types.h ; fi # out-of-dir behaviour varies between installations -if test -f ch2icfb ; then if SED=/usr/bin/sed GREP=/usr/bin/grep /bin/bash ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -o rsb_libspblas_handle.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.lo rsb.F90 +if test -f ch2icfb ; then if SED=/usr/bin/sed GREP=/usr/bin/grep /bin/sh ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.lo rsb.F90 gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o rsb.o rsb.F90 -libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -o rsb_blas_sparse.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas_handle.c -o rsb_libspblas_handle.o >/dev/null 2>&1 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb.F90 -fPIC -o .libs/rsb.o libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb.F90 -o rsb.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_libspblas.c -o rsb_libspblas.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -libtool: warning: '-version-info/-version-number' is ignored for convenience libraries -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c rsb_blas_sparse.F90 -o rsb_blas_sparse.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_spblas.a .libs/rsb_libspblas_handle.o .libs/rsb_libspblas.o libtool: link: ranlib .libs/librsb_spblas.a libtool: link: ( cd ".libs" && rm -f "librsb_spblas.la" && ln -s "../librsb_spblas.la" "librsb_spblas.la" ) +libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_base.a .libs/librsb_base_la-rsb_is.o .libs/librsb_base_la-rsb_mio.o .libs/librsb_base_la-rsb_op.o .libs/librsb_base_la-rsb_bio.o .libs/librsb_base_la-rsb_get.o .libs/librsb_base_la-rsb_set.o .libs/librsb_base_la-rsb_coo.o .libs/librsb_base_la-rsb_csr.o .libs/librsb_base_la-rsb_coo_check.o .libs/librsb_base_la-rsb_coo_symm.o .libs/librsb_base_la-rsb_idx.o .libs/librsb_base_la-rsb_srt.o .libs/librsb_base_la-rsb_srtp.o .libs/librsb_base_la-rsb_src.o .libs/librsb_base_la-rsb_test_accuracy.o .libs/librsb_base_la-rsb_clone.o .libs/librsb_base_la-rsb_rec.o .libs/librsb_base_la-rsb_render.o .libs/librsb_base_la-rsb_eps.o .libs/librsb_base_la-rsb_msort_up.o .libs/librsb_base_la-rsb_sys.o .libs/librsb_base_la-rsb_blas_stuff.o .libs/librsb_base_la-rsb_gen.o .libs/librsb_base_la-rsb_perf.o .libs/librsb_base_la-rsb_rsb.o .libs/librsb_base_la-rsb_err.o .libs/librsb_base_la-rsb_tune.o .libs/librsb_base_la-rsb_do.o .libs/librsb_base_la-rsb_internals.o .libs/librsb_base_la-rsb_garbage.o .libs/librsb_base_la-rsb_mmio.o .libs/librsb_base_la-rsb_partition.o .libs/librsb_base_la-rsb_mbw.o .libs/librsb_base_la-rsb_limiter.o .libs/librsb_base_la-rsb_fpb.o .libs/librsb_base_la-rsb_spgemm.o .libs/librsb_base_la-rsb_spsum.o .libs/librsb_base_la-rsb_spsv.o .libs/librsb_base_la-rsb_lock.o .libs/librsb_base_la-rsb_swt.o .libs/librsb_base_la-rsb_init.o .libs/librsb_base_la-rsb_dump.o .libs/librsb_base_la-rsb_cpmv.o .libs/librsb_base_la-rsb_asm.o .libs/librsb_base_la-rsb_user.o .libs/librsb_base_la-rsb_coo2rec.o .libs/librsb_base_la-rsb_rec2coo.o .libs/librsb_base_la-rsb_rec2csr.o .libs/librsb_base_la-rsb_csr2coo.o .libs/rsb_blas_sparse.o libtool: link: ranlib .libs/librsb_base.a libtool: link: ( cd ".libs" && rm -f "librsb_base.la" && ln -s "../librsb_base.la" "librsb_base.la" ) @@ -2371,12 +2407,12 @@ | ~~~~~~~~~~~~~~~~~ libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_nounroll.a .libs/librsb_nounroll_la-rsb_stropts.o .libs/librsb_nounroll_la-rsb_strmif.o .libs/librsb_nounroll_la-rsb_unroll.o .libs/librsb_nounroll_la-rsb_krnl_vb.o .libs/librsb_nounroll_la-rsb_krnl_lb.o .libs/librsb_nounroll_la-rsb_krnl.o .libs/librsb_nounroll_la-rsb_bench.o .libs/librsb_nounroll_la-rsb_mergesort.o .libs/librsb_nounroll_la-rsb_permute.o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss.o .libs/librsb_nounroll_la-rsb_spmv.o .libs/librsb_nounroll_la-rsb_merge.o .libs/librsb_nounroll_la-rsb_ompio.o .libs/librsb_nounroll_la-rsb_util.o .libs/librsb_nounroll_la-rsb_spgemm_csr.o .libs/librsb_nounroll_la-rsb_spsum_misc.o .libs/librsb_nounroll_la-rsb_prec.o libtool: link: ranlib .libs/librsb_nounroll.a libtool: link: ( cd ".libs" && rm -f "librsb_nounroll.la" && ln -s "../librsb_nounroll.la" "librsb_nounroll.la" ) -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/aarch64-linux-gnu rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/aarch64-linux-gnu rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: link: gcc -shared -fPIC -DPIC .libs/rsb.o -Wl,--whole-archive ./.libs/librsb_nounroll.a ./.libs/librsb_base.a ./.libs/librsb_spblas.a /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/.libs/librsbpp.a -Wl,--no-whole-archive -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lpthread -lstdc++fs -lstdc++ -lhwloc -lz -lgfortran -lm -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Werror=format-security -mbranch-protection=standard -O3 -Wl,-z -Wl,relro -fopenmp -fopenmp -Wl,-soname -Wl,librsb.so.0 -o .libs/librsb.so.0.0.0 libtool: link: (cd ".libs" && rm -f "librsb.so.0" && ln -s "librsb.so.0.0.0" "librsb.so.0") libtool: link: (cd ".libs" && rm -f "librsb.so" && ln -s "librsb.so.0.0.0" "librsb.so") @@ -2388,7 +2424,7 @@ libtool: link: ranlib .libs/librsb.a libtool: link: rm -fr .libs/librsb.lax libtool: link: ( cd ".libs" && rm -f "librsb.la" && ln -s "../librsb.la" "librsb.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: warning: '-version-info' is ignored for programs libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o -fopenmp ./.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -2405,26 +2441,26 @@ gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o fortran.o fortran.F90 gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -mbranch-protection=standard -pipe -fopenmp -c -o fortran_rsb_fi.o fortran_rsb_fi.F90 g++ -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -c -o cplusplus.o cplusplus.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/hello hello.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/io-spblas io-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran_rsb_fi fortran_rsb_fi.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/backsolve backsolve.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/power power.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/hello-spblas hello-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/io-spblas io-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/autotune autotune.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/backsolve backsolve.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran_rsb_fi fortran_rsb_fi.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/fortran fortran.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/snippets snippets.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp -Wl,-z -Wl,relro -o .libs/cplusplus cplusplus.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/aarch64-linux-gnu/14 -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../aarch64-linux-gnu -L/usr/lib/gcc/aarch64-linux-gnu/14/../../../../lib -L/lib/aarch64-linux-gnu -L/lib/../lib -L/usr/lib/aarch64-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/aarch64-linux-gnu/14/../../.. -lgfortran -lm -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' @@ -2444,11 +2480,11 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/doc' /usr/bin/mkdir -p man /usr/bin/mkdir -p man -SOURCE_DATE_EPOCH=1767272461 \ - help2man --name="provide configuration information for librsb" --no-info /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb-config | /usr/bin/sed 's/January //g' > man/librsb-config.1 gmake makedox -SOURCE_DATE_EPOCH=1767272461 \ +SOURCE_DATE_EPOCH=1735642861 \ help2man --name="benchmark and test for librsb" --no-info ../rsbench | /usr/bin/sed 's/January //g' > man/rsbench.1 +SOURCE_DATE_EPOCH=1735642861 \ + help2man --name="provide configuration information for librsb" --no-info /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb-config | /usr/bin/sed 's/January //g' > man/librsb-config.1 gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/doc' DOXYGEN_PROJECT_NUMBER=1.3.0.2 doxygen Doxyfile || echo "are you sure you have doxygen installed ?" warning: Tag 'HTML_TIMESTAMP' at line 1513 of file 'Doxyfile' has become obsolete. @@ -3159,13 +3195,13 @@ g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt_ne-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rgt_rv-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +libtool: link: g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' Making all in examples @@ -3180,25 +3216,25 @@ g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o mtx2bin.o mtx2bin.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o render.o render.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o span.o span.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib/examples' gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' @@ -3208,7 +3244,7 @@ gmake all-am gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' g++ -DHAVE_CONFIG_H -I. -I/build/reproducible-path/librsb-1.3.0.2+dfsg -Wdate-time -D_FORTIFY_SOURCE=2 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -c -o rsbtest.o rsbtest.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -Wl,-z -Wl,relro -o .libs/rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lstdc++fs -fopenmp gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' @@ -3284,7 +3320,7 @@ gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake mtests -C . gmake[3]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash -ex ./scripts/readme-tests.sh +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh -ex ./scripts/readme-tests.sh + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x + ./rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # --bench option implies -qH -R --write-performance-record --want-mkl-autotune --mkl-benchmark --types : --split-experimental 6 --merge-experimental 6 --also-transpose --sort-filenames-list --want-memory-benchmark @@ -3294,15 +3330,15 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1773327824 +# beginning run at 1738918478 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -# average timer granularity: 7.7e-08 s -# Will write a final performance record to file rsbench_pr__1773327824_gcc-14.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1773327824_gcc-14.2-1,4th.rpr.tmp +# average timer granularity: 7.81e-08 s +# Will write a final performance record to file rsbench_pr__1738918478_gcc-14.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1738918478_gcc-14.2-1,4th.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -3341,61 +3377,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 5.352s +# Memory benchmark took 5.385s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 8 samples (2240 bytes). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.356s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.389s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type Z... -# file input of A.mtx took 0.00 s (6 nnz, 35951 nnz/s ) (1.10 MB/s ) -#pre-sorting (6 elements) took 0.00186896 s -#weeding duplicates (to 6 elements) took 2.86102e-06 s (and check, 3.09944e-06 s ) +# file input of A.mtx took 0.00 s (6 nnz, 35900 nnz/s ) (1.10 MB/s ) +#pre-sorting (6 elements) took 0.0184989 s +#weeding duplicates (to 6 elements) took 3.09944e-06 s (and check, 1.90735e-06 s ) # multi-nrhs benchmarking (1,2) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.006s): (3 x 3)[0xaaab0efff940]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.019s): (3 x 3)[0xaaab0b448980]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 0.002438s; avg 0.0008127s ( +/- 0.22/ 0.30 %); best 0.0008109s; worst 0.0008152s; std dev. 1.809e-06 (taking best). -Reference operation time is 0.000810862 s (0.1184 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0008109 Mflops: 0.118) -Merge (3 -> 1 leaves) took w.c.t. of 2.003e-05s, ~9.06e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (1 th.) took 0.000303s; avg 0.000101s ( +/- 99.92/199.06 %); best 8.301e-08s; worst 0.0003021s; std dev. 0.0001422 (taking best). -Reference operation time is 8.30054e-08 s (1157 Mflops) with 1 threads. -After merge step 1: tpop: 8.301e-08 s ~Mflops: 1156.551 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 9768.778x: 0.0008109s -> 8.301e-08s, so taking this instance. +3 iterations (1 th.) took 0.00466s; avg 0.001553s ( +/- 32.72/ 34.35 %); best 0.001045s; worst 0.002087s; std dev. 0.0004257 (taking best). +Reference operation time is 0.00104499 s (0.09187 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001045 Mflops: 0.092) +Merge (3 -> 1 leaves) took w.c.t. of 3.219e-05s, ~1.192e-05s of computing time (of which 2.146e-06s sorting, 7.153e-06s analysis) +3 iterations (1 th.) took 0.000299s; avg 9.966e-05s ( +/- 99.04/198.09 %); best 9.537e-07s; worst 0.0002971s; std dev. 0.0001396 (taking best). +Reference operation time is 9.53674e-07 s (100.7 Mflops) with 1 threads. +After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1095.750x: 0.001045s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002422s (of which 2.694e-05s partitioning, 0s I/O); computing times: 9.06e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.002422s, equivalent to 29177.1/3.0 new/old ops (0.004333s for 2 clones -- as 52201.6/5.3 ops, or 26100.8/2.7 ops per clone), SPEEDUP of 9768.778x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 9768.778x (0.0008109s -> 8.301e-08s), will amortize in 3.0 ops by saving 0.0008108s per op. -In 1 tuning rounds (tot. 0.0072s, 0.0043s for constructor, 2 clones) obtained a SPEEDUP of 976777.8% (9769x) (from 0.1184 to 1157 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003905s (of which 3.791e-05s partitioning, 0s I/O); computing times: 1.192e-05s in par. loops, 2.146e-06s sorting, 7.153e-06s analyzing) +Total merge + benchmarking process took 0.003905s, equivalent to 4094.8/3.7 new/old ops (0.007133s for 2 clones -- as 7479.2/6.8 ops, or 3739.6/3.4 ops per clone), SPEEDUP of 1095.750x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 1095.750x (0.001045s -> 9.537e-07s), will amortize in 3.7 ops by saving 0.001044s per op. +In 1 tuning rounds (tot. 0.012s, 0.0071s for constructor, 2 clones) obtained a SPEEDUP of 109475.0% (1096x) (from 0.09187 to 100.7 Mflops). #pr: updating sample at index 1 (0^th of 8), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.00730491 s (8.109e-04 s -> 8.301e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0123999 s (1.045e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0305431 s and estimated a speedup of 1.000000 x (8.301e-08 s -> 8.301e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0663822 s and estimated a speedup of 1.000000 x (8.205e-08 s -> 8.205e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.002001 0.002088 0.004089 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.004089 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.002001 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.002088 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.001687 0.010491 0.012178 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.012178 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.001687 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.010491 %:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.004089 +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.012178 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 @@ -3410,47 +3446,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.008s): (3 x 3)[0xaaab0efff940]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.017s): (3 x 3)[0xaaab0b448980]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.002659s; avg 0.0008863s ( +/- 28.58/ 36.98 %); best 0.000633s; worst 0.001214s; std dev. 0.000243 (taking best). -Reference operation time is 0.000633001 s (0.1517 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000633 Mflops: 0.152) -Merge (3 -> 1 leaves) took w.c.t. of 7.868e-06s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (4 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 91.97/200.00 %); best 8.301e-08s; worst 3.099e-06s; std dev. 1.461e-06 (taking best). -Reference operation time is 8.30054e-08 s (1157 Mflops) with 4 threads. -After merge step 1: tpop: 8.301e-08 s ~Mflops: 1156.551 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 7626.023x: 0.000633s -> 8.301e-08s, so taking this instance. +3 iterations (4 th.) took 0.003963s; avg 0.001321s ( +/- 36.11/ 40.06 %); best 0.000844s; worst 0.00185s; std dev. 0.0004124 (taking best). +Reference operation time is 0.000844002 s (0.1137 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000844 Mflops: 0.114) +Merge (3 -> 1 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) +3 iterations (4 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 92.06/200.00 %); best 8.205e-08s; worst 3.099e-06s; std dev. 1.461e-06 (taking best). +Reference operation time is 8.20518e-08 s (1170 Mflops) with 4 threads. +After merge step 1: tpop: 8.205e-08 s ~Mflops: 1169.993 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 10286.212x: 0.000844s -> 8.205e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002259s (of which 1.097e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.002259s, equivalent to 27215.3/3.6 new/old ops (0.006169s for 2 clones -- as 74321.4/9.7 ops, or 37160.7/4.9 ops per clone), SPEEDUP of 7626.023x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 7626.023x (0.000633s -> 8.301e-08s), will amortize in 3.6 ops by saving 0.0006329s per op. -In 1 tuning rounds (tot. 0.0089s, 0.0062s for constructor, 2 clones) obtained a SPEEDUP of 762502.3% (7626x) (from 0.1517 to 1157 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003077s (of which 1.407e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.003077s, equivalent to 37501.1/3.6 new/old ops (0.01243s for 2 clones -- as 151451.4/14.7 ops, or 75725.7/7.4 ops per clone), SPEEDUP of 10286.212x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 10286.212x (0.000844s -> 8.205e-08s), will amortize in 3.6 ops by saving 0.0008439s per op. +In 1 tuning rounds (tot. 0.016s, 0.012s for constructor, 2 clones) obtained a SPEEDUP of 1028521.2% (1.029e+04x) (from 0.1137 to 1170 Mflops). #pr: updating sample at index 5 (1^th of 8), 0^th touch for (0,1,0,0,0,0,0). -First run of RSB Autotuner took 0.00888991 s (6.330e-04 s -> 8.301e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0164661 s (8.440e-04 s -> 8.205e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.039444 s and estimated a speedup of 1.000000 x (8.301e-08 s -> 8.301e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0526161 s and estimated a speedup of 1.000000 x (8.205e-08 s -> 8.205e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.001255 0.003824 0.005079 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.005079 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.001255 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.003824 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.002566 0.008956 0.011522 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.011522 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.002566 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.008956 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.005079 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.011522 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.81 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.81 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 1.59 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.55 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 1.59 0.55 0.81 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.06 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.06 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.66 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 1.17 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.66 1.17 1.06 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -3459,50 +3495,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 0.00573301 1e+09 1e+09 +%operation:A.mtx 0.019289 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 0 0.00200081 0 0.00208783 +%constructor:A.mtx 0 0.00168705 0 0.0104911 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,2) -- now using nrhs 2. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.004s): (3 x 3)[0xaaab0efff940]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.019s): (3 x 3)[0xaaab0b448980]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 0.002193s; avg 0.000731s ( +/- 3.72/ 3.72 %); best 0.0007038s; worst 0.0007582s; std dev. 2.219e-05 (taking best). -Reference operation time is 0.000703812 s (0.2728 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0007038 Mflops: 0.273) -Merge (3 -> 1 leaves) took w.c.t. of 1.311e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) -3 iterations (1 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 95.03/142.86 %); best 8.301e-08s; worst 4.053e-06s; std dev. 1.73e-06 (taking best). -Reference operation time is 8.30054e-08 s (2313 Mflops) with 1 threads. -After merge step 1: tpop: 8.301e-08 s ~Mflops: 2313.102 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 8479.104x: 0.0007038s -> 8.301e-08s, so taking this instance. +3 iterations (1 th.) took 0.001834s; avg 0.0006114s ( +/- 1.34/ 1.08 %); best 0.0006032s; worst 0.000618s; std dev. 6.138e-06 (taking best). +Reference operation time is 0.000603199 s (0.3183 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0006032 Mflops: 0.318) +Merge (3 -> 1 leaves) took w.c.t. of 8.821e-06s, ~2.861e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (1 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 93.93/129.41 %); best 8.205e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). +Reference operation time is 8.20518e-08 s (2340 Mflops) with 1 threads. +After merge step 1: tpop: 8.205e-08 s ~Mflops: 2339.987 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 7351.446x: 0.0006032s -> 8.205e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002069s (of which 1.597e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 0.002069s, equivalent to 24926.0/2.9 new/old ops (0.004213s for 2 clones -- as 50754.0/6.0 ops, or 25377.0/3.0 ops per clone), SPEEDUP of 8479.104x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 8479.104x (0.0007038s -> 8.301e-08s), will amortize in 2.9 ops by saving 0.0007037s per op. -In 1 tuning rounds (tot. 0.0065s, 0.0042s for constructor, 2 clones) obtained a SPEEDUP of 847810.4% (8479x) (from 0.2728 to 2313 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.006786s (of which 1.192e-05s partitioning, 0s I/O); computing times: 2.861e-06s in par. loops, 9.537e-07s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.006786s, equivalent to 82702.3/11.2 new/old ops (0.00847s for 2 clones -- as 103228.2/14.0 ops, or 51614.1/7.0 ops per clone), SPEEDUP of 7351.446x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 7351.446x (0.0006032s -> 8.205e-08s), will amortize in 11.3 ops by saving 0.0006031s per op. +In 1 tuning rounds (tot. 0.01s, 0.0085s for constructor, 2 clones) obtained a SPEEDUP of 735044.6% (7351x) (from 0.3183 to 2340 Mflops). #pr: updating sample at index 3 (2^th of 8), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.00648403 s (7.038e-04 s -> 8.301e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0103781 s (6.032e-04 s -> 8.205e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0348201 s and estimated a speedup of 1.000000 x (8.301e-08 s -> 8.301e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0497038 s and estimated a speedup of 1.000000 x (8.205e-08 s -> 8.205e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.000924 0.001550 0.002474 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.002474 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.000924 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.001550 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.004649 0.003373 0.008022 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.008022 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.004649 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.003373 %:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.002474 +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.008022 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 @@ -3517,47 +3553,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.004s): (3 x 3)[0xaaab0efff940]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.007s): (3 x 3)[0xaaab0b448980]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 0.002372s; avg 0.0007907s ( +/- 16.14/ 19.26 %); best 0.000663s; worst 0.0009429s; std dev. 0.0001156 (taking best). -Reference operation time is 0.000663042 s (0.2896 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000663 Mflops: 0.290) -Merge (3 -> 1 leaves) took w.c.t. of 1.097e-05s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 2.861e-06s analysis) -3 iterations (4 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 93.86/200.00 %); best 8.301e-08s; worst 4.053e-06s; std dev. 1.911e-06 (taking best). -Reference operation time is 8.30054e-08 s (2313 Mflops) with 4 threads. -After merge step 1: tpop: 8.301e-08 s ~Mflops: 2313.102 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 7987.936x: 0.000663s -> 8.301e-08s, so taking this instance. +3 iterations (4 th.) took 0.002351s; avg 0.0007837s ( +/- 18.34/ 27.75 %); best 0.0006399s; worst 0.001001s; std dev. 0.0001564 (taking best). +Reference operation time is 0.000639915 s (0.3 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0006399 Mflops: 0.300) +Merge (3 -> 1 leaves) took w.c.t. of 7.868e-06s, ~2.146e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (4 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 91.40/200.00 %); best 8.205e-08s; worst 2.861e-06s; std dev. 1.349e-06 (taking best). +Reference operation time is 8.20518e-08 s (2340 Mflops) with 4 threads. +After merge step 1: tpop: 8.205e-08 s ~Mflops: 2339.987 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 7798.925x: 0.0006399s -> 8.205e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002318s (of which 1.287e-05s partitioning, 0s I/O); computing times: 1.907e-06s in par. loops, 9.537e-07s sorting, 2.861e-06s analyzing) -Total merge + benchmarking process took 0.002318s, equivalent to 27924.7/3.5 new/old ops (0.00386s for 2 clones -- as 46502.9/5.8 ops, or 23251.5/2.9 ops per clone), SPEEDUP of 7987.936x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 7987.936x (0.000663s -> 8.301e-08s), will amortize in 3.5 ops by saving 0.000663s per op. -In 1 tuning rounds (tot. 0.0063s, 0.0039s for constructor, 2 clones) obtained a SPEEDUP of 798693.6% (7988x) (from 0.2896 to 2313 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003401s (of which 8.821e-06s partitioning, 0s I/O); computing times: 2.146e-06s in par. loops, 9.537e-07s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.003401s, equivalent to 41449.9/5.3 new/old ops (0.005455s for 2 clones -- as 66482.6/8.5 ops, or 33241.3/4.3 ops per clone), SPEEDUP of 7798.925x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 7798.925x (0.0006399s -> 8.205e-08s), will amortize in 5.3 ops by saving 0.0006398s per op. +In 1 tuning rounds (tot. 0.0078s, 0.0055s for constructor, 2 clones) obtained a SPEEDUP of 779792.5% (7799x) (from 0.3 to 2340 Mflops). #pr: updating sample at index 7 (3^th of 8), 0^th touch for (0,1,0,0,1,0,0). -First run of RSB Autotuner took 0.00630593 s (6.630e-04 s -> 8.301e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00785208 s (6.399e-04 s -> 8.205e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0330529 s and estimated a speedup of 1.000000 x (8.301e-08 s -> 8.301e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0690689 s and estimated a speedup of 1.000000 x (8.205e-08 s -> 8.205e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.001018 0.001954 0.002972 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.002972 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.001018 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.001954 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.001995 0.002685 0.004680 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004680 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.001995 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.002685 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.002972 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.004680 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.83 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.83 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.91 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.79 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 0.91 0.79 0.83 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.71 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 1.71 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 2.33 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 1.26 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 nan 2.33 1.26 1.71 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -3566,185 +3602,185 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 0.00406599 1e+09 1e+09 +%operation:A.mtx 0.019347 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 0 0.00092411 0 0.00154996 +%constructor:A.mtx 0 0.00464916 0 0.00337315 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.565s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.167s/0.000s . +# so far, program took 5.777s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.285s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.0553s (system CPU time used) -ru_utime : 7.224s (user CPU time used) +ru_stime : 0.05777s (system CPU time used) +ru_utime : 7.1s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1156.55 8.109e-04 0.000e+00 8.301e-08 0.000e+00 7.305e-03 3.23e+00 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1156.55 6.330e-04 0.000e+00 8.301e-08 0.000e+00 8.890e-03 3.23e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 1.045e-03 0.000e+00 9.537e-07 0.000e+00 1.240e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1169.99 8.440e-04 0.000e+00 8.205e-08 0.000e+00 1.647e-02 3.27e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 869640.1 % faster, avg. sp. ratio 8697.401x, max sp. ratio 9768.778x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 97552.8/88005.2/107100.4/195105.6 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.5/ 9.0/ 14.0/ 23.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 11.5, min. 9.0, max. 14.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 568998.1 % faster, avg. sp. ratio 5690.981x, max sp. ratio 10286.212x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 106841.1/13002.2/200679.9/213682.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.7/ 11.9/ 19.5/ 31.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.7, min. 11.9, max. 19.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.650/ 2.650/ 2.650,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.457/ 3.229/ 3.229,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.456/ 0.231/ 2.681,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.547/ 0.281/ 3.266,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.157e+03, min 1.157e+03, max 1.157e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.350e-01, min 1.184e-01, max 1.517e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 8.301e-08s, min 8.301e-08s, max 8.301e-08s, tot 1.660e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.219e-04s, min 6.330e-04s, max 8.109e-04s, tot 1.444e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.750e+01 1.750e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.029e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 6.353e+02, min 1.007e+02, max 1.170e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.028e-01, min 9.187e-02, max 1.137e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.179e-07s, min 8.205e-08s, max 9.537e-07s, tot 1.036e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 9.445e-04s, min 8.440e-04s, max 1.045e-03s, tot 1.889e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.770e+01 2.058e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.006e+00 #pr: ======== Limiting to nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2313.10 7.038e-04 0.000e+00 8.301e-08 0.000e+00 6.484e-03 4.96e+00 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2313.10 6.630e-04 0.000e+00 8.301e-08 0.000e+00 6.306e-03 4.96e+00 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2339.99 6.032e-04 0.000e+00 8.205e-08 0.000e+00 1.038e-02 5.02e+00 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2339.99 6.399e-04 0.000e+00 8.205e-08 0.000e+00 7.852e-03 5.02e+00 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 823252.0 % faster, avg. sp. ratio 8233.520x, max sp. ratio 8479.104x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 77042.9/75970.1/78115.8/154085.9 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.4/ 9.2/ 9.5/ 18.7 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.4, min. 9.2, max. 9.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 757418.5 % faster, avg. sp. ratio 7575.185x, max sp. ratio 7798.925x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 111089.6/95696.6/126482.6/222179.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.7/ 12.3/ 17.2/ 29.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.7, min. 12.3, max. 17.2 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.807/ 3.807/ 3.807,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.927/ 4.964/ 4.964,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.851/ 3.851/ 3.851,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.042/ 5.021/ 5.021,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.313e+03, min 2.313e+03, max 2.313e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.812e-01, min 2.728e-01, max 2.896e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 8.301e-08s, min 8.301e-08s, max 8.301e-08s, tot 1.660e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.834e-04s, min 6.630e-04s, max 7.038e-04s, tot 1.367e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.219e+01 1.219e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.029e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.340e+03, min 2.340e+03, max 2.340e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.092e-01, min 3.000e-01, max 3.183e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 8.205e-08s, min 8.205e-08s, max 8.205e-08s, tot 1.641e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.216e-04s, min 6.032e-04s, max 6.399e-04s, tot 1.243e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.233e+01 1.233e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.006e+00 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 1.262e+01 x, min 2.000e+00 x, max 2.325e+01 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1156.55 8.109e-04 0.000e+00 8.301e-08 0.000e+00 7.305e-03 3.23e+00 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2313.10 7.038e-04 0.000e+00 8.301e-08 0.000e+00 6.484e-03 4.96e+00 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1156.55 6.330e-04 0.000e+00 8.301e-08 0.000e+00 8.890e-03 3.23e+00 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2313.10 6.630e-04 0.000e+00 8.301e-08 0.000e+00 6.306e-03 4.96e+00 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 1.045e-03 0.000e+00 9.537e-07 0.000e+00 1.240e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2339.99 6.032e-04 0.000e+00 8.205e-08 0.000e+00 1.038e-02 5.02e+00 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1169.99 8.440e-04 0.000e+00 8.205e-08 0.000e+00 1.647e-02 3.27e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2339.99 6.399e-04 0.000e+00 8.205e-08 0.000e+00 7.852e-03 5.02e+00 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 846446.0 % faster, avg. sp. ratio 8465.460x, max sp. ratio 9768.778x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 87297.9/75970.1/107100.4/349191.4 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.4/ 9.0/ 14.0/ 41.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.4, min. 9.0, max. 14.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 663208.3 % faster, avg. sp. ratio 6633.083x, max sp. ratio 10286.212x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 108965.4/13002.2/200679.9/435861.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.2/ 11.9/ 19.5/ 60.9 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.2, min. 11.9, max. 19.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.229/ 2.650/ 3.807,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.384/ 3.229/ 4.964,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.654/ 0.231/ 3.851,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 13.590/ 0.281/ 5.021,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.735e+03, min 1.157e+03, max 2.313e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.081e-01, min 1.184e-01, max 2.896e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 8.301e-08s, min 8.301e-08s, max 8.301e-08s, tot 3.320e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.027e-04s, min 6.330e-04s, max 8.109e-04s, tot 2.811e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.219e+01 1.750e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.029e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.488e+03, min 1.007e+02, max 2.340e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.060e-01, min 9.187e-02, max 3.183e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 3.000e-07s, min 8.205e-08s, max 9.537e-07s, tot 1.200e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 7.830e-04s, min 6.032e-04s, max 1.045e-03s, tot 3.132e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.233e+01 2.058e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.006e+00 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 1.262e+01 x, min 2.000e+00 x, max 2.325e+01 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1156.55 8.109e-04 0.000e+00 8.301e-08 0.000e+00 7.305e-03 3.23e+00 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1156.55 6.330e-04 0.000e+00 8.301e-08 0.000e+00 8.890e-03 3.23e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 1.045e-03 0.000e+00 9.537e-07 0.000e+00 1.240e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1169.99 8.440e-04 0.000e+00 8.205e-08 0.000e+00 1.647e-02 3.27e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 869640.1 % faster, avg. sp. ratio 8697.401x, max sp. ratio 9768.778x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 97552.8/88005.2/107100.4/195105.6 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.5/ 9.0/ 14.0/ 23.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 11.5, min. 9.0, max. 14.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 568998.1 % faster, avg. sp. ratio 5690.981x, max sp. ratio 10286.212x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 106841.1/13002.2/200679.9/213682.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.7/ 11.9/ 19.5/ 31.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.7, min. 11.9, max. 19.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.650/ 2.650/ 2.650,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.457/ 3.229/ 3.229,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.456/ 0.231/ 2.681,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.547/ 0.281/ 3.266,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.157e+03, min 1.157e+03, max 1.157e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.350e-01, min 1.184e-01, max 1.517e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 8.301e-08s, min 8.301e-08s, max 8.301e-08s, tot 1.660e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.219e-04s, min 6.330e-04s, max 8.109e-04s, tot 1.444e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.750e+01 1.750e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.029e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.03 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 6.353e+02, min 1.007e+02, max 1.170e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.028e-01, min 9.187e-02, max 1.137e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.179e-07s, min 8.205e-08s, max 9.537e-07s, tot 1.036e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 9.445e-04s, min 8.440e-04s, max 1.045e-03s, tot 1.889e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.770e+01 2.058e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.006e+00 #pr: ======== Limiting to both transA=N and nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2313.10 7.038e-04 0.000e+00 8.301e-08 0.000e+00 6.484e-03 4.96e+00 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2313.10 6.630e-04 0.000e+00 8.301e-08 0.000e+00 6.306e-03 4.96e+00 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2339.99 6.032e-04 0.000e+00 8.205e-08 0.000e+00 1.038e-02 5.02e+00 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2339.99 6.399e-04 0.000e+00 8.205e-08 0.000e+00 7.852e-03 5.02e+00 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 823252.0 % faster, avg. sp. ratio 8233.520x, max sp. ratio 8479.104x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 77042.9/75970.1/78115.8/154085.9 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.4/ 9.2/ 9.5/ 18.7 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.4, min. 9.2, max. 9.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 757418.5 % faster, avg. sp. ratio 7575.185x, max sp. ratio 7798.925x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 111089.6/95696.6/126482.6/222179.3 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.7/ 12.3/ 17.2/ 29.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.7, min. 12.3, max. 17.2 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.807/ 3.807/ 3.807,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.927/ 4.964/ 4.964,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.851/ 3.851/ 3.851,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.042/ 5.021/ 5.021,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.313e+03, min 2.313e+03, max 2.313e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.812e-01, min 2.728e-01, max 2.896e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 8.301e-08s, min 8.301e-08s, max 8.301e-08s, tot 1.660e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.834e-04s, min 6.630e-04s, max 7.038e-04s, tot 1.367e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.219e+01 1.219e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.029e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.340e+03, min 2.340e+03, max 2.340e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.092e-01, min 3.000e-01, max 3.183e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 8.205e-08s, min 8.205e-08s, max 8.205e-08s, tot 1.641e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.216e-04s, min 6.032e-04s, max 6.399e-04s, tot 1.243e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.233e+01 1.233e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.006e+00 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 1.262e+01 x, min 2.000e+00 x, max 2.325e+01 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 4) matched the dump criteria -- skipping dump round. #pr: ======== Limiting to both transA=T and nrhs=1: @@ -3754,44 +3790,44 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1156.55 8.109e-04 0.000e+00 8.301e-08 0.000e+00 7.305e-03 3.23e+00 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2313.10 7.038e-04 0.000e+00 8.301e-08 0.000e+00 6.484e-03 4.96e+00 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1156.55 6.330e-04 0.000e+00 8.301e-08 0.000e+00 8.890e-03 3.23e+00 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2313.10 6.630e-04 0.000e+00 8.301e-08 0.000e+00 6.306e-03 4.96e+00 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 100.66 1.045e-03 0.000e+00 9.537e-07 0.000e+00 1.240e-02 2.81e-01 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 2339.99 6.032e-04 0.000e+00 8.205e-08 0.000e+00 1.038e-02 5.02e+00 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1169.99 8.440e-04 0.000e+00 8.205e-08 0.000e+00 1.647e-02 3.27e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 2339.99 6.399e-04 0.000e+00 8.205e-08 0.000e+00 7.852e-03 5.02e+00 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 846446.0 % faster, avg. sp. ratio 8465.460x, max sp. ratio 9768.778x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 87297.9/75970.1/107100.4/349191.4 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.4/ 9.0/ 14.0/ 41.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.4, min. 9.0, max. 14.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 663208.3 % faster, avg. sp. ratio 6633.083x, max sp. ratio 10286.212x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 108965.4/13002.2/200679.9/435861.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.2/ 11.9/ 19.5/ 60.9 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.2, min. 11.9, max. 19.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.229/ 2.650/ 3.807,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.384/ 3.229/ 4.964,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.654/ 0.231/ 3.851,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 13.590/ 0.281/ 5.021,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.03 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.735e+03, min 1.157e+03, max 2.313e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.081e-01, min 1.184e-01, max 2.896e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 8.301e-08s, min 8.301e-08s, max 8.301e-08s, tot 3.320e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.027e-04s, min 6.330e-04s, max 8.109e-04s, tot 2.811e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.219e+01 1.750e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.029e+00 -#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) -#pr: Record collection took 0.17 s. +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.488e+03, min 1.007e+02, max 2.340e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.060e-01, min 9.187e-02, max 3.183e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 3.000e-07s, min 8.205e-08s, max 9.537e-07s, tot 1.200e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 7.830e-04s, min 6.032e-04s, max 1.045e-03s, tot 3.132e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.233e+01 2.058e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.006e+00 +#pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 1.262e+01 x, min 2.000e+00 x, max 2.325e+01 x (2 samples, the non-min-nrhs ones) +#pr: Record collection took 0.31 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 100 environment variables in 5413 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 100 environment variables in 5467 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1773327824_gcc-14.2-1,4th.rpr -# Removing the temporary record file rsbench_pr__1773327824_gcc-14.2-1,4th.rpr.tmp. -# terminating run at 1773327830 (after 5.6s of w.c.t.) +#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1738918478_gcc-14.2-1,4th.rpr +# Removing the temporary record file rsbench_pr__1738918478_gcc-14.2-1,4th.rpr.tmp. +# terminating run at 1738918483 (after 5.8s of w.c.t.) + ./rsbench -oa -Ob --help /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench is a swiss army knife for testing the library functionality and performance. You can use it to perform sparse matrix - unitary vector multiplication, specifying the blocking parameters, the times to perform multiplication. @@ -4063,10 +4099,10 @@ L1 size: 24576 L2 size: 524288 sysconf() : 4096 bytes per pagesize -sysconf() : 15402653 physical pages -sysconf() : 63089266688 bytes (60166 MB) of physical memory -sysconf() : 12695244 available (free) physical pages -sysconf() : 51999719424 available (free) physical memory +sysconf() : 15402651 physical pages +sysconf() : 63089258496 bytes (60166 MB) of physical memory +sysconf() : 4748291 available (free) physical pages +sysconf() : 19448999936 available (free) physical memory sysconf() , processors : 12 sysconf() , processors online : 12 sysconf() : no level 1 cache @@ -4091,30 +4127,30 @@ RSB_SUBM_IDX_MARKER : 2147483647 RSB_MAX_ALLOCATABLE_MEMORY_CHUNK: 18446744073709551615 timing min delta (if negative, don't complain with us) : 0 s -timing granularity : 7.74503e-08 s +timing granularity : 3.33428e-08 s CFLAGS : -g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 CXXFLAGS : -g -O2 -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -fopenmp CC : gcc memhinfo : L2:4/64/512K,L1:8/64/24K -detected free memory : 51999719424 -detected total memory : 63089266688 -for array sized 524288 elems, took 0.000434875 s for linear search and 0 s for binary search for element 524287, in 136 tries, for a total of 0.100156 s (ignore this:142606064) -for array sized 524288 elems, took 0.000174999 s for linear search and 0 s for binary search for element 262143, in 542 tries, for a total of 0.100061 s (ignore this:426769076) -for array sized 524288 elems, took 8.67844e-05 s for linear search and 0 s for binary search for element 131071, in 1130 tries, for a total of 0.100065 s (ignore this:722989536) -for array sized 524288 elems, took 4.29153e-05 s for linear search and 0 s for binary search for element 65535, in 2263 tries, for a total of 0.100034 s (ignore this:1019600946) -for array sized 524288 elems, took 2.09808e-05 s for linear search and 0 s for binary search for element 32767, in 4538 tries, for a total of 0.100009 s (ignore this:1316994238) -for array sized 524288 elems, took 1.09673e-05 s for linear search and 0 s for binary search for element 16383, in 9011 tries, for a total of 0.100006 s (ignore this:1612248664) -for array sized 524288 elems, took 4.76837e-06 s for linear search and 0 s for binary search for element 8191, in 17947 tries, for a total of 0.100000 s (ignore this:1906256418) -for array sized 524288 elems, took 1.90735e-06 s for linear search and 0 s for binary search for element 4095, in 35299 tries, for a total of 0.100001 s (ignore this:-2099612068) -for array sized 524288 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 2047, in 68382 tries, for a total of 0.100001 s (ignore this:-1819656160) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 1023, in 128447 tries, for a total of 0.100001 s (ignore this:-1556853598) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 511, in 229247 tries, for a total of 0.100000 s (ignore this:-1322563164) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 255, in 389241 tries, for a total of 0.100000 s (ignore this:-1124050254) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 127, in 588702 tries, for a total of 0.100001 s (ignore this:-974519946) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 63, in 786115 tries, for a total of 0.100000 s (ignore this:-875469456) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 31, in 956518 tries, for a total of 0.100000 s (ignore this:-816165340) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 15, in 1074709 tries, for a total of 0.100000 s (ignore this:-783924070) -for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 7, in 1135997 tries, for a total of 0.100000 s (ignore this:-768020112) +detected free memory : 19448999936 +detected total memory : 63089258496 +for array sized 524288 elems, took 0.000349998 s for linear search and 0 s for binary search for element 524287, in 270 tries, for a total of 0.100292 s (ignore this:283114980) +for array sized 524288 elems, took 0.000174999 s for linear search and 0 s for binary search for element 262143, in 570 tries, for a total of 0.100123 s (ignore this:581958000) +for array sized 524288 elems, took 8.67844e-05 s for linear search and 0 s for binary search for element 131071, in 1138 tries, for a total of 0.100078 s (ignore this:880275596) +for array sized 524288 elems, took 4.29153e-05 s for linear search and 0 s for binary search for element 65535, in 2274 tries, for a total of 0.100008 s (ignore this:1178328776) +for array sized 524288 elems, took 2.09808e-05 s for linear search and 0 s for binary search for element 32767, in 4538 tries, for a total of 0.100013 s (ignore this:1475722068) +for array sized 524288 elems, took 1.09673e-05 s for linear search and 0 s for binary search for element 16383, in 9017 tries, for a total of 0.100010 s (ignore this:1771173090) +for array sized 524288 elems, took 4.76837e-06 s for linear search and 0 s for binary search for element 8191, in 17957 tries, for a total of 0.100005 s (ignore this:2065344664) +for array sized 524288 elems, took 1.90735e-06 s for linear search and 0 s for binary search for element 4095, in 35327 tries, for a total of 0.100002 s (ignore this:-1940294502) +for array sized 524288 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 2047, in 68315 tries, for a total of 0.100000 s (ignore this:-1660612892) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 1023, in 128256 tries, for a total of 0.100000 s (ignore this:-1398201116) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 511, in 231433 tries, for a total of 0.100001 s (ignore this:-1161676590) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 255, in 387903 tries, for a total of 0.100000 s (ignore this:-963846060) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 127, in 580014 tries, for a total of 0.100000 s (ignore this:-816522504) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 63, in 779128 tries, for a total of 0.100001 s (ignore this:-718352376) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 31, in 936102 tries, for a total of 0.100001 s (ignore this:-660314052) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 15, in 1054527 tries, for a total of 0.100000 s (ignore this:-628678242) +for array sized 524288 elems, took 0 s for linear search and 0 s for binary search for element 7, in 1114441 tries, for a total of 0.100000 s (ignore this:-613076068) + ./rsbench -C /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench version: 1.3.0 format switches:br @@ -4161,17 +4197,17 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1773327832 +# beginning run at 1738918486 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx --verbose --nrhs 1,4 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 # User did not specify threads; assuming 1. Environment provides max 12 threads; this build supports max 128. # User did not specify threads; assuming 1. Environment provides max 12 threads; this build supports max 128. -# average timer granularity: 7.86e-08 s -# Will write a final performance record to file rsbench_pr__1773327832_gcc-14.2.rpr and periodic checkpoints to rsbench_pr__1773327832_gcc-14.2.rpr.tmp +# average timer granularity: 7.82e-08 s +# Will write a final performance record to file rsbench_pr__1738918486_gcc-14.2.rpr and periodic checkpoints to rsbench_pr__1738918486_gcc-14.2.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -4210,61 +4246,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 5.382s +# Memory benchmark took 5.320s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 16 samples (4480 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.386s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.324s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type D... -# file input of A.mtx took 0.00 s (6 nnz, 69711 nnz/s ) (2.14 MB/s ) -#pre-sorting (6 elements) took 0.00166011 s -#weeding duplicates (to 6 elements) took 2.86102e-06 s (and check, 1.90735e-06 s ) +# file input of A.mtx took 0.00 s (6 nnz, 66052 nnz/s ) (2.03 MB/s ) +#pre-sorting (6 elements) took 0.00831699 s +#weeding duplicates (to 6 elements) took 3.09944e-06 s (and check, 1.90735e-06 s ) # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.007s): (3 x 3)[0xaaaae3f6e110]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.008s): (3 x 3)[0xaaaadbff4110]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.001572s; avg 0.000524s ( +/- 0.36/ 0.36 %); best 0.0005221s; worst 0.000526s; std dev. 1.557e-06 (taking best). -Reference operation time is 0.000522137 s (0.04596 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0005221 Mflops: 0.046) -Merge (3 -> 1 leaves) took w.c.t. of 2.313e-05s, ~8.821e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 0.0001121s; avg 3.735e-05s ( +/- 99.79/196.81 %); best 7.82e-08s; worst 0.0001109s; std dev. 5.198e-05 (taking best). -Reference operation time is 7.82013e-08 s (306.9 Mflops) with 12 threads. -After merge step 1: tpop: 7.82e-08 s ~Mflops: 306.900 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 6676.829x: 0.0005221s -> 7.82e-08s, so taking this instance. +3 iterations (12 th.) took 0.005986s; avg 0.001995s ( +/- 34.20/ 33.86 %); best 0.001313s; worst 0.002671s; std dev. 0.0005544 (taking best). +Reference operation time is 0.00131297 s (0.01828 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001313 Mflops: 0.018) +Merge (3 -> 1 leaves) took w.c.t. of 2.909e-05s, ~1.097e-05s of computing time (of which 9.537e-07s sorting, 5.96e-06s analysis) +3 iterations (12 th.) took 0.0001259s; avg 4.196e-05s ( +/- 97.73/195.45 %); best 9.537e-07s; worst 0.000124s; std dev. 5.799e-05 (taking best). +Reference operation time is 9.53674e-07 s (25.17 Mflops) with 12 threads. +After merge step 1: tpop: 9.537e-07 s ~Mflops: 25.166 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 1376.750x: 0.001313s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001556s (of which 2.813e-05s partitioning, 0s I/O); computing times: 8.821e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.001556s, equivalent to 19899.4/3.0 new/old ops (0.00289s for 2 clones -- as 36960.4/5.5 ops, or 18480.2/2.8 ops per clone), SPEEDUP of 6676.829x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 6676.829x (0.0005221s -> 7.82e-08s), will amortize in 3.0 ops by saving 0.0005221s per op. -In 1 tuning rounds (tot. 0.0047s, 0.0029s for constructor, 2 clones) obtained a SPEEDUP of 667582.9% (6677x) (from 0.04596 to 306.9 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.005963s (of which 3.505e-05s partitioning, 0s I/O); computing times: 1.097e-05s in par. loops, 9.537e-07s sorting, 5.96e-06s analyzing) +Total merge + benchmarking process took 0.005963s, equivalent to 6252.5/4.5 new/old ops (0.009907s for 2 clones -- as 10388.0/7.5 ops, or 5194.0/3.8 ops per clone), SPEEDUP of 1376.750x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1376.750x (0.001313s -> 9.537e-07s), will amortize in 4.5 ops by saving 0.001312s per op. +In 1 tuning rounds (tot. 0.016s, 0.0099s for constructor, 2 clones) obtained a SPEEDUP of 137575.0% (1377x) (from 0.01828 to 25.17 Mflops). #pr: updating sample at index 1 (0^th of 16), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.00471997 s (5.221e-04 s -> 7.820e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0161819 s (1.313e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0441082 s and estimated a speedup of 1.000000 x (7.820e-08 s -> 7.820e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0634949 s and estimated a speedup of 1.000000 x (7.915e-08 s -> 7.915e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.002557 0.002566 0.005123 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.005123 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002557 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.002566 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.002947 0.003174 0.006121 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.006121 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.002947 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.003174 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.005123 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.006121 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4279,50 +4315,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00648999 1e+09 1e+09 +%operation:A.mtx 0.00807023 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00255704 0 0.0025661 +%constructor:A.mtx 0 0.00294685 0 0.00317407 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.005s): (3 x 3)[0xaaaae3f6e110]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.006s): (3 x 3)[0xaaaadbff4110]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.003424s; avg 0.001141s ( +/- 27.01/ 39.84 %); best 0.000833s; worst 0.001596s; std dev. 0.0003282 (taking best). -Reference operation time is 0.000833035 s (0.1152 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000833 Mflops: 0.115) -Merge (3 -> 1 leaves) took w.c.t. of 1.407e-05s, ~5.007e-06s of computing time (of which 1.907e-06s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 2.408e-05s; avg 8.027e-06s ( +/- 99.03/188.12 %); best 7.82e-08s; worst 2.313e-05s; std dev. 1.068e-05 (taking best). -Reference operation time is 7.82013e-08 s (1228 Mflops) with 12 threads. -After merge step 1: tpop: 7.82e-08 s ~Mflops: 1227.601 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 10652.439x: 0.000833s -> 7.82e-08s, so taking this instance. +3 iterations (12 th.) took 0.008735s; avg 0.002912s ( +/- 62.29/ 34.53 %); best 0.001098s; worst 0.003917s; std dev. 0.001285 (taking best). +Reference operation time is 0.00109792 s (0.08744 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.001098 Mflops: 0.087) +Merge (3 -> 1 leaves) took w.c.t. of 1.812e-05s, ~5.007e-06s of computing time (of which 1.192e-06s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 2.384e-05s; avg 7.947e-06s ( +/- 88.00/176.00 %); best 9.537e-07s; worst 2.193e-05s; std dev. 9.89e-06 (taking best). +Reference operation time is 9.53674e-07 s (100.7 Mflops) with 12 threads. +After merge step 1: tpop: 9.537e-07 s ~Mflops: 100.663 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 1151.250x: 0.001098s -> 9.537e-07s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002449s (of which 3.505e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 1.907e-06s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.002449s, equivalent to 31317.1/2.9 new/old ops (0.004809s for 2 clones -- as 61500.0/5.8 ops, or 30750.0/2.9 ops per clone), SPEEDUP of 10652.439x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 10652.439x (0.000833s -> 7.82e-08s), will amortize in 2.9 ops by saving 0.000833s per op. -In 1 tuning rounds (tot. 0.0084s, 0.0048s for constructor, 2 clones) obtained a SPEEDUP of 1065143.9% (1.065e+04x) (from 0.1152 to 1228 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.003793s (of which 2.289e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 1.192e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.003793s, equivalent to 3977.2/3.5 new/old ops (0.01576s for 2 clones -- as 16523.5/14.4 ops, or 8261.8/7.2 ops per clone), SPEEDUP of 1151.250x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1151.250x (0.001098s -> 9.537e-07s), will amortize in 3.5 ops by saving 0.001097s per op. +In 1 tuning rounds (tot. 0.025s, 0.016s for constructor, 2 clones) obtained a SPEEDUP of 115025.0% (1151x) (from 0.08744 to 100.7 Mflops). #pr: updating sample at index 9 (1^th of 16), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.00837898 s (8.330e-04 s -> 7.820e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0246432 s (1.098e-03 s -> 9.537e-07 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.034416 s and estimated a speedup of 1.000000 x (7.820e-08 s -> 7.820e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0536649 s and estimated a speedup of 1.000000 x (7.915e-08 s -> 7.915e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001663 0.001662 0.003325 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003325 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001663 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001662 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001814 0.002020 0.003834 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003834 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001814 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.002020 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003325 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003834 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4337,59 +4373,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00497794 1e+09 1e+09 +%operation:A.mtx 0.0059731 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00166297 0 0.00166202 +%constructor:A.mtx 0 0.00181389 0 0.00202012 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.502s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.092s/0.000s . +# so far, program took 5.520s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.158s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.02814s (system CPU time used) -ru_utime : 6.42s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.03124s (system CPU time used) +ru_utime : 6.418s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.502s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.092s/0.000s . +# so far, program took 5.520s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.158s/0.000s . # Reusing type converted (D->S) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.005s): (3 x 3)[0xaaaae3f6e110]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.012s): (3 x 3)[0xaaaadbff4110]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.002236s; avg 0.0007453s ( +/- 44.47/ 67.47 %); best 0.0004139s; worst 0.001248s; std dev. 0.0003615 (taking best). -Reference operation time is 0.000413895 s (0.05799 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004139 Mflops: 0.058) -Merge (3 -> 1 leaves) took w.c.t. of 1.287e-05s, ~5.007e-06s of computing time (of which 1.192e-06s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 95.31/128.57 %); best 7.82e-08s; worst 3.815e-06s; std dev. 1.593e-06 (taking best). -Reference operation time is 7.82013e-08 s (306.9 Mflops) with 12 threads. -After merge step 1: tpop: 7.82e-08 s ~Mflops: 306.900 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5292.683x: 0.0004139s -> 7.82e-08s, so taking this instance. +3 iterations (12 th.) took 0.002882s; avg 0.0009607s ( +/- 1.84/ 3.04 %); best 0.0009429s; worst 0.0009899s; std dev. 2.083e-05 (taking best). +Reference operation time is 0.000942945 s (0.02545 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0009429 Mflops: 0.025) +Merge (3 -> 1 leaves) took w.c.t. of 1.407e-05s, ~4.053e-06s of computing time (of which 1.192e-06s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 6.199e-06s; avg 2.066e-06s ( +/- 96.17/142.31 %); best 7.915e-08s; worst 5.007e-06s; std dev. 2.135e-06 (taking best). +Reference operation time is 7.9155e-08 s (303.2 Mflops) with 12 threads. +After merge step 1: tpop: 7.915e-08 s ~Mflops: 303.203 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 11912.651x: 0.0009429s -> 7.915e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001211s (of which 1.597e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 1.192e-06s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.001211s, equivalent to 15484.8/2.9 new/old ops (0.00452s for 2 clones -- as 57798.8/10.9 ops, or 28899.4/5.5 ops per clone), SPEEDUP of 5292.683x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5292.683x (0.0004139s -> 7.82e-08s), will amortize in 2.9 ops by saving 0.0004138s per op. -In 1 tuning rounds (tot. 0.0069s, 0.0045s for constructor, 2 clones) obtained a SPEEDUP of 529168.3% (5293x) (from 0.05799 to 306.9 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.00274s (of which 1.693e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 1.192e-06s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.00274s, equivalent to 34614.5/2.9 new/old ops (0.005962s for 2 clones -- as 75319.3/6.3 ops, or 37659.6/3.2 ops per clone), SPEEDUP of 11912.651x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 11912.651x (0.0009429s -> 7.915e-08s), will amortize in 2.9 ops by saving 0.0009429s per op. +In 1 tuning rounds (tot. 0.009s, 0.006s for constructor, 2 clones) obtained a SPEEDUP of 1191165.1% (1.191e+04x) (from 0.02545 to 303.2 Mflops). #pr: updating sample at index 3 (2^th of 16), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.00686288 s (4.139e-04 s -> 7.820e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00903893 s (9.429e-04 s -> 7.915e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0300519 s and estimated a speedup of 1.000000 x (7.820e-08 s -> 7.820e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.052115 s and estimated a speedup of 1.000000 x (7.915e-08 s -> 7.915e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001736 0.001618 0.003354 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003354 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001736 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001618 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.007968 0.002015 0.009983 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.009983 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.007968 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.002015 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003354 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.009983 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4404,50 +4440,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00483704 1e+09 1e+09 +%operation:A.mtx 0.0119729 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00173593 0 0.00161791 +%constructor:A.mtx 0 0.00796795 0 0.00201488 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.006s): (3 x 3)[0xaaaae3f6e4a0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.005s): (3 x 3)[0xaaaadbff4110]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.002079s; avg 0.000693s ( +/- 3.88/ 5.62 %); best 0.0006661s; worst 0.0007319s; std dev. 2.819e-05 (taking best). -Reference operation time is 0.000666142 s (0.1441 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0006661 Mflops: 0.144) -Merge (3 -> 1 leaves) took w.c.t. of 1.216e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 92.43/200.00 %); best 7.82e-08s; worst 3.099e-06s; std dev. 1.461e-06 (taking best). -Reference operation time is 7.82013e-08 s (1228 Mflops) with 12 threads. -After merge step 1: tpop: 7.82e-08 s ~Mflops: 1227.601 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 8518.293x: 0.0006661s -> 7.82e-08s, so taking this instance. +3 iterations (12 th.) took 0.002936s; avg 0.0009786s ( +/- 12.61/ 22.91 %); best 0.0008552s; worst 0.001203s; std dev. 0.0001588 (taking best). +Reference operation time is 0.000855207 s (0.1123 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0008552 Mflops: 0.112) +Merge (3 -> 1 leaves) took w.c.t. of 1.597e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) +3 iterations (12 th.) took 5.96e-06s; avg 1.987e-06s ( +/- 96.02/152.00 %); best 7.915e-08s; worst 5.007e-06s; std dev. 2.171e-06 (taking best). +Reference operation time is 7.9155e-08 s (1213 Mflops) with 12 threads. +After merge step 1: tpop: 7.915e-08 s ~Mflops: 1212.811 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 10804.217x: 0.0008552s -> 7.915e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002552s (of which 1.502e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 9.537e-07s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.002552s, equivalent to 32634.1/3.8 new/old ops (0.005074s for 2 clones -- as 64887.2/7.6 ops, or 32443.6/3.8 ops per clone), SPEEDUP of 8518.293x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 8518.293x (0.0006661s -> 7.82e-08s), will amortize in 3.8 ops by saving 0.0006661s per op. -In 1 tuning rounds (tot. 0.0073s, 0.0051s for constructor, 2 clones) obtained a SPEEDUP of 851729.3% (8518x) (from 0.1441 to 1228 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002506s (of which 2.408e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 9.537e-07s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.002506s, equivalent to 31659.6/2.9 new/old ops (0.00522s for 2 clones -- as 65942.8/6.1 ops, or 32971.4/3.1 ops per clone), SPEEDUP of 10804.217x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 10804.217x (0.0008552s -> 7.915e-08s), will amortize in 2.9 ops by saving 0.0008551s per op. +In 1 tuning rounds (tot. 0.0083s, 0.0052s for constructor, 2 clones) obtained a SPEEDUP of 1080321.7% (1.08e+04x) (from 0.1123 to 1213 Mflops). #pr: updating sample at index 11 (3^th of 16), 0^th touch for (0,0,0,0,1,1,0). -First run of RSB Autotuner took 0.00734901 s (6.661e-04 s -> 7.820e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00835896 s (8.552e-04 s -> 7.915e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0308981 s and estimated a speedup of 1.000000 x (7.820e-08 s -> 7.820e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0421669 s and estimated a speedup of 1.000000 x (7.915e-08 s -> 7.915e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001940 0.001829 0.003769 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003769 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001940 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001829 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001572 0.001579 0.003151 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003151 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001572 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001579 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003769 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.003151 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4462,59 +4498,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00604296 1e+09 1e+09 +%operation:A.mtx 0.00494099 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00194001 0 0.00182891 +%constructor:A.mtx 0 0.00157213 0 0.00157881 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.595s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.167s/0.000s . +# so far, program took 5.662s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.270s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.03235s (system CPU time used) -ru_utime : 7.171s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.0394s (system CPU time used) +ru_utime : 7.175s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was S). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.595s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.167s/0.000s . +# so far, program took 5.662s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.270s/0.000s . # Reusing type converted (S->C) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.004s): (3 x 3)[0xaaaae3f71500]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.006s): (3 x 3)[0xaaaadbff7520]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.001618s; avg 0.0005393s ( +/- 12.64/ 24.58 %); best 0.0004711s; worst 0.0006719s; std dev. 9.375e-05 (taking best). -Reference operation time is 0.000471115 s (0.2038 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004711 Mflops: 0.204) -Merge (3 -> 1 leaves) took w.c.t. of 1.097e-05s, ~4.053e-06s of computing time (of which 0s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 9.394e-05s; avg 3.131e-05s ( +/- 99.75/196.95 %); best 7.82e-08s; worst 9.298e-05s; std dev. 4.361e-05 (taking best). -Reference operation time is 7.82013e-08 s (1228 Mflops) with 12 threads. -After merge step 1: tpop: 7.82e-08 s ~Mflops: 1227.601 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 6024.390x: 0.0004711s -> 7.82e-08s, so taking this instance. +3 iterations (12 th.) took 0.002621s; avg 0.0008736s ( +/- 24.46/ 23.27 %); best 0.0006599s; worst 0.001077s; std dev. 0.0001704 (taking best). +Reference operation time is 0.000659943 s (0.1455 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0006599 Mflops: 0.145) +Merge (3 -> 1 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 0s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 9.513e-05s; avg 3.171e-05s ( +/- 99.75/196.24 %); best 7.915e-08s; worst 9.394e-05s; std dev. 4.4e-05 (taking best). +Reference operation time is 7.9155e-08 s (1213 Mflops) with 12 threads. +After merge step 1: tpop: 7.915e-08 s ~Mflops: 1212.811 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 8337.349x: 0.0006599s -> 7.915e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001577s (of which 1.311e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 0s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.001577s, equivalent to 20167.7/3.3 new/old ops (0.00289s for 2 clones -- as 36954.3/6.1 ops, or 18477.1/3.1 ops per clone), SPEEDUP of 6024.390x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 6024.390x (0.0004711s -> 7.82e-08s), will amortize in 3.3 ops by saving 0.000471s per op. -In 1 tuning rounds (tot. 0.0047s, 0.0029s for constructor, 2 clones) obtained a SPEEDUP of 602339.0% (6024x) (from 0.2038 to 1228 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002353s (of which 1.407e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 0s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.002353s, equivalent to 29725.9/3.6 new/old ops (0.005988s for 2 clones -- as 75650.6/9.1 ops, or 37825.3/4.5 ops per clone), SPEEDUP of 8337.349x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 8337.349x (0.0006599s -> 7.915e-08s), will amortize in 3.6 ops by saving 0.0006599s per op. +In 1 tuning rounds (tot. 0.0088s, 0.006s for constructor, 2 clones) obtained a SPEEDUP of 833634.9% (8337x) (from 0.1455 to 1213 Mflops). #pr: updating sample at index 5 (4^th of 16), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.00466204 s (4.711e-04 s -> 7.820e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00876617 s (6.599e-04 s -> 7.915e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0310402 s and estimated a speedup of 1.000000 x (7.820e-08 s -> 7.820e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0452509 s and estimated a speedup of 1.000000 x (7.915e-08 s -> 7.915e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001625 0.001138 0.002763 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002763 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001625 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001138 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001893 0.002646 0.004539 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004539 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001893 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.002646 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002763 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.004539 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4529,50 +4565,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00383806 1e+09 1e+09 +%operation:A.mtx 0.00575495 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00162506 0 0.00113797 +%constructor:A.mtx 0 0.00189281 0 0.00264597 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.003s): (3 x 3)[0xaaaae3f71500]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.005s): (3 x 3)[0xaaaadbff7520]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.00139s; avg 0.0004633s ( +/- 0.48/ 0.81 %); best 0.0004611s; worst 0.0004671s; std dev. 2.657e-06 (taking best). -Reference operation time is 0.000461102 s (0.8328 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004611 Mflops: 0.833) -Merge (3 -> 1 leaves) took w.c.t. of 6.914e-06s, ~3.099e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 3.815e-06s; avg 1.272e-06s ( +/- 93.85/125.00 %); best 7.82e-08s; worst 2.861e-06s; std dev. 1.189e-06 (taking best). -Reference operation time is 7.82013e-08 s (4910 Mflops) with 12 threads. -After merge step 1: tpop: 7.82e-08 s ~Mflops: 4910.405 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5896.341x: 0.0004611s -> 7.82e-08s, so taking this instance. +3 iterations (12 th.) took 0.003579s; avg 0.001193s ( +/- 52.47/ 67.16 %); best 0.000567s; worst 0.001994s; std dev. 0.0005957 (taking best). +Reference operation time is 0.000566959 s (0.6773 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000567 Mflops: 0.677) +Merge (3 -> 1 leaves) took w.c.t. of 1.907e-05s, ~5.96e-06s of computing time (of which 1.192e-06s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 95.26/142.86 %); best 7.915e-08s; worst 4.053e-06s; std dev. 1.73e-06 (taking best). +Reference operation time is 7.9155e-08 s (4851 Mflops) with 12 threads. +After merge step 1: tpop: 7.915e-08 s ~Mflops: 4851.243 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 7162.651x: 0.000567s -> 7.915e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001697s (of which 0.0001738s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001697s, equivalent to 21698.2/3.7 new/old ops (0.002866s for 2 clones -- as 36649.4/6.2 ops, or 18324.7/3.1 ops per clone), SPEEDUP of 5896.341x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5896.341x (0.0004611s -> 7.82e-08s), will amortize in 3.7 ops by saving 0.000461s per op. -In 1 tuning rounds (tot. 0.0045s, 0.0029s for constructor, 2 clones) obtained a SPEEDUP of 589534.1% (5896x) (from 0.8328 to 4910 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002307s (of which 2.289e-05s partitioning, 0s I/O); computing times: 5.96e-06s in par. loops, 1.192e-06s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.002307s, equivalent to 29144.6/4.1 new/old ops (0.005051s for 2 clones -- as 63810.2/8.9 ops, or 31905.1/4.5 ops per clone), SPEEDUP of 7162.651x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 7162.651x (0.000567s -> 7.915e-08s), will amortize in 4.1 ops by saving 0.0005669s per op. +In 1 tuning rounds (tot. 0.0087s, 0.0051s for constructor, 2 clones) obtained a SPEEDUP of 716165.1% (7163x) (from 0.6773 to 4851 Mflops). #pr: updating sample at index 13 (5^th of 16), 0^th touch for (0,0,0,0,1,2,0). -First run of RSB Autotuner took 0.00447702 s (4.611e-04 s -> 7.820e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00872517 s (5.670e-04 s -> 7.915e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.025599 s and estimated a speedup of 1.000000 x (7.820e-08 s -> 7.820e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.0580771 s and estimated a speedup of 1.000000 x (7.915e-08 s -> 7.915e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001054 0.000939 0.001993 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001993 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001054 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000939 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001227 0.001476 0.002703 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002703 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001227 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001476 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001993 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002703 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4587,59 +4623,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00292397 1e+09 1e+09 +%operation:A.mtx 0.00478792 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00105405 0 0.000939131 +%constructor:A.mtx 0 0.0012269 0 0.00147605 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.675s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.233s/0.000s . +# so far, program took 5.803s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.390s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.03251s (system CPU time used) -ru_utime : 7.833s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.0514s (system CPU time used) +ru_utime : 7.796s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was C). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.675s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.233s/0.000s . +# so far, program took 5.803s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.390s/0.000s . # Reusing type converted (C->Z) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.003s): (3 x 3)[0xaaaae3f71500]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.005s): (3 x 3)[0xaaaadbff7520]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.001655s; avg 0.0005517s ( +/- 2.12/ 3.33 %); best 0.00054s; worst 0.0005701s; std dev. 1.314e-05 (taking best). -Reference operation time is 0.000540018 s (0.1778 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.00054 Mflops: 0.178) -Merge (3 -> 1 leaves) took w.c.t. of 6.914e-06s, ~3.099e-06s of computing time (of which 1.192e-06s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 1.001e-05s; avg 3.338e-06s ( +/- 97.66/171.43 %); best 7.82e-08s; worst 9.06e-06s; std dev. 4.065e-06 (taking best). -Reference operation time is 7.82013e-08 s (1228 Mflops) with 12 threads. -After merge step 1: tpop: 7.82e-08 s ~Mflops: 1227.601 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 6905.488x: 0.00054s -> 7.82e-08s, so taking this instance. +3 iterations (12 th.) took 0.002171s; avg 0.0007237s ( +/- 20.40/ 15.37 %); best 0.000576s; worst 0.0008349s; std dev. 0.0001088 (taking best). +Reference operation time is 0.000576019 s (0.1667 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.000576 Mflops: 0.167) +Merge (3 -> 1 leaves) took w.c.t. of 1.407e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (12 th.) took 1.478e-05s; avg 4.927e-06s ( +/- 98.39/200.00 %); best 7.915e-08s; worst 1.478e-05s; std dev. 6.968e-06 (taking best). +Reference operation time is 7.9155e-08 s (1213 Mflops) with 12 threads. +After merge step 1: tpop: 7.915e-08 s ~Mflops: 1212.811 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 7277.108x: 0.000576s -> 7.915e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001572s (of which 8.821e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 1.192e-06s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001572s, equivalent to 20100.6/2.9 new/old ops (0.003163s for 2 clones -- as 40445.1/5.9 ops, or 20222.6/2.9 ops per clone), SPEEDUP of 6905.488x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 6905.488x (0.00054s -> 7.82e-08s), will amortize in 2.9 ops by saving 0.0005399s per op. -In 1 tuning rounds (tot. 0.0049s, 0.0032s for constructor, 2 clones) obtained a SPEEDUP of 690448.8% (6905x) (from 0.1778 to 1228 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002024s (of which 1.693e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 9.537e-07s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.002024s, equivalent to 25569.3/3.5 new/old ops (0.00948s for 2 clones -- as 119762.0/16.5 ops, or 59881.0/8.2 ops per clone), SPEEDUP of 7277.108x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 7277.108x (0.000576s -> 7.915e-08s), will amortize in 3.5 ops by saving 0.0005759s per op. +In 1 tuning rounds (tot. 0.012s, 0.0095s for constructor, 2 clones) obtained a SPEEDUP of 727610.8% (7277x) (from 0.1667 to 1213 Mflops). #pr: updating sample at index 7 (6^th of 16), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.00486994 s (5.400e-04 s -> 7.820e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0117428 s (5.760e-04 s -> 7.915e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0234501 s and estimated a speedup of 1.000000 x (7.820e-08 s -> 7.820e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.043571 s and estimated a speedup of 1.000000 x (7.915e-08 s -> 7.915e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001192 0.001180 0.002372 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002372 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001192 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001180 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001668 0.001110 0.002778 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002778 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001668 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001110 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002372 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002778 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4654,50 +4690,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.003479 1e+09 1e+09 +%operation:A.mtx 0.00467992 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.00119185 0 0.00118017 +%constructor:A.mtx 0 0.00166798 0 0.00110984 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 12 threads -# Constructed matrix (took 0.003s): (3 x 3)[0xaaaae3f71500]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.005s): (3 x 3)[0xaaaadbff7520]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (12 th.) took 0.001289s; avg 0.0004296s ( +/- 2.05/ 1.50 %); best 0.0004208s; worst 0.0004361s; std dev. 6.453e-06 (taking best). -Reference operation time is 0.000420809 s (0.9125 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0004208 Mflops: 0.913) -Merge (3 -> 1 leaves) took w.c.t. of 6.914e-06s, ~3.099e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 91.80/100.00 %); best 7.82e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 7.82013e-08 s (4910 Mflops) with 12 threads. -After merge step 1: tpop: 7.82e-08 s ~Mflops: 4910.405 nsubm:1 otn:12 -Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 5381.098x: 0.0004208s -> 7.82e-08s, so taking this instance. +3 iterations (12 th.) took 0.002832s; avg 0.000944s ( +/- 33.27/ 43.23 %); best 0.0006299s; worst 0.001352s; std dev. 0.0003022 (taking best). +Reference operation time is 0.000629902 s (0.6096 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.0006299 Mflops: 0.610) +Merge (3 -> 1 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 1.192e-06s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 95.26/142.86 %); best 7.915e-08s; worst 4.053e-06s; std dev. 1.73e-06 (taking best). +Reference operation time is 7.9155e-08 s (4851 Mflops) with 12 threads. +After merge step 1: tpop: 7.915e-08 s ~Mflops: 4851.243 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 7957.831x: 0.0006299s -> 7.915e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001824s (of which 8.821e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.001824s, equivalent to 23323.2/4.3 new/old ops (0.003073s for 2 clones -- as 39295.7/7.3 ops, or 19647.9/3.7 ops per clone), SPEEDUP of 5381.098x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 5381.098x (0.0004208s -> 7.82e-08s), will amortize in 4.3 ops by saving 0.0004207s per op. -In 1 tuning rounds (tot. 0.0044s, 0.0031s for constructor, 2 clones) obtained a SPEEDUP of 538009.8% (5381x) (from 0.9125 to 4910 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002721s (of which 1.311e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 1.192e-06s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.002721s, equivalent to 34376.5/4.3 new/old ops (0.006685s for 2 clones -- as 84454.8/10.6 ops, or 42227.4/5.3 ops per clone), SPEEDUP of 7957.831x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 7957.831x (0.0006299s -> 7.915e-08s), will amortize in 4.3 ops by saving 0.0006298s per op. +In 1 tuning rounds (tot. 0.0096s, 0.0067s for constructor, 2 clones) obtained a SPEEDUP of 795683.1% (7958x) (from 0.6096 to 4851 Mflops). #pr: updating sample at index 15 (7^th of 16), 0^th touch for (0,0,0,0,1,3,0). -First run of RSB Autotuner took 0.00442004 s (4.208e-04 s -> 7.820e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.00960708 s (6.299e-04 s -> 7.915e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.0238569 s and estimated a speedup of 1.000000 x (7.820e-08 s -> 7.820e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.041456 s and estimated a speedup of 1.000000 x (7.915e-08 s -> 7.915e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.000996 0.000847 0.001843 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001843 -%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.000996 -%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.000847 +%:CONSTRUCTOR_TIMES:A.mtx S N 12 3 3 6 0.000000 0.001060 0.001877 0.002937 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002937 +%:RSB_SUBDIVISION_TIME:A.mtx S N 12 3 3 6 0.001060 +%:RSB_SHUFFLE_TIME:A.mtx S N 12 3 3 6 0.001877 %:ROW_MAJOR_SORT_TIME:A.mtx S N 12 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 12 3 3 6 nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.001843 +%:SORTEDCOO2RSB_TIME:A.mtx S N 12 3 3 6 0.002937 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 12 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 12 3 3 6 1.00 @@ -4712,332 +4748,332 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 12 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[12] SPMV[12] SPMV[12] -%operation:A.mtx 0.00268912 1e+09 1e+09 +%operation:A.mtx 0.00462103 1e+09 1e+09 %constructor:matrix SORT[12] SCAN[12] SHUFFLE[12] INSERT[12] -%constructor:A.mtx 0 0.000995874 0 0.000847101 +%constructor:A.mtx 0 0.00106001 0 0.00187707 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 5.743s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.289s/0.000s . +# so far, program took 5.928s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.497s/0.000s . getrusage() stats: -ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.03271s (system CPU time used) -ru_utime : 8.401s (user CPU time used) +ru_maxrss: 8 (maximum resident set size -- MB) +ru_stime : 0.05901s (system CPU time used) +ru_utime : 8.387s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to type D: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 306.90 5.221e-04 0.000e+00 7.820e-08 0.000e+00 4.720e-03 1.89e+00 5.17e+00 1 2.40e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1227.60 8.330e-04 0.000e+00 7.820e-08 0.000e+00 8.379e-03 4.65e+00 2.79e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 25.17 1.313e-03 0.000e+00 9.537e-07 0.000e+00 1.618e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 100.66 1.098e-03 0.000e+00 9.537e-07 0.000e+00 2.464e-02 3.82e-01 2.79e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 866363.4 % faster, avg. sp. ratio 8664.634x, max sp. ratio 10652.439x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 83751.5/60356.7/107146.3/167503.0 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.5/ 9.0/ 10.1/ 19.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.6, min. 9.0, max. 10.1 ops) +#pr: (in succ. cases rsb autotuning gave avg. 126300.0 % faster, avg. sp. ratio 1264.000x, max sp. ratio 1376.750x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 21404.1/16968.0/25840.2/42808.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 17.4/ 12.3/ 22.4/ 34.8 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 17.4, min. 12.3, max. 22.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.506/ 1.586/ 3.427,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.547/ 1.893/ 4.655,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 0.206/ 0.130/ 0.281,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 0.537/ 0.155/ 0.382,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 3.979/ 2.792/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.673e+02, min 3.069e+02, max 1.228e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 8.060e-02, min 4.596e-02, max 1.152e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 1.564e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.776e-04s, min 5.221e-04s, max 8.330e-04s, tot 1.355e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.368e+01 2.957e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.02 s, max 0.02 s, tot 0.04 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.02 s, max 0.02 s, tot 0.04 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 6.291e+01, min 2.517e+01, max 1.007e+02 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 5.286e-02, min 1.828e-02, max 8.744e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 9.537e-07s, min 9.537e-07s, max 9.537e-07s, tot 1.907e-06s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.205e-03s, min 1.098e-03s, max 1.313e-03s, tot 2.411e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.676e+02 3.622e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type S: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 306.90 4.139e-04 0.000e+00 7.820e-08 0.000e+00 6.863e-03 1.13e+00 3.17e+00 1 2.40e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1227.60 6.661e-04 0.000e+00 7.820e-08 0.000e+00 7.349e-03 2.51e+00 1.54e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 303.20 9.429e-04 0.000e+00 7.915e-08 0.000e+00 9.039e-03 1.11e+00 3.17e+00 1 2.40e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1212.81 8.552e-04 0.000e+00 7.915e-08 0.000e+00 8.359e-03 2.48e+00 1.54e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 690448.8 % faster, avg. sp. ratio 6905.488x, max sp. ratio 8518.293x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 90867.4/87759.1/93975.6/181734.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.8/ 11.0/ 16.6/ 27.6 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 13.8, min. 11.0, max. 16.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 1135743.4 % faster, avg. sp. ratio 11358.434x, max sp. ratio 11912.651x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 109897.6/105602.4/114192.8/219795.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.7/ 9.6/ 9.8/ 19.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 9.7, min. 9.6, max. 9.8 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 8/ 8/ 8) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 24/ 24/ 24) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.432/ 0.972/ 1.893,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.632/ 1.125/ 2.506,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.415/ 0.960/ 1.870,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 3.588/ 1.112/ 2.476,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.354/ 1.542/ 3.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.673e+02, min 3.069e+02, max 1.228e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.010e-01, min 5.799e-02, max 1.441e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 1.564e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.400e-04s, min 4.139e-04s, max 6.661e-04s, tot 1.080e-03s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.478e+01 4.825e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 7.580e+02, min 3.032e+02, max 1.213e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 6.885e-02, min 2.545e-02, max 1.123e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 7.915e-08s, min 7.915e-08s, max 7.915e-08s, tot 1.583e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.991e-04s, min 8.552e-04s, max 9.429e-04s, tot 1.798e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.519e+01 4.905e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type C: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1227.60 4.711e-04 0.000e+00 7.820e-08 0.000e+00 4.662e-03 1.89e+00 1.29e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.611e-04 0.000e+00 7.820e-08 0.000e+00 4.477e-03 4.65e+00 6.98e-01 1 3.84e-04 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1212.81 6.599e-04 0.000e+00 7.915e-08 0.000e+00 8.766e-03 1.87e+00 1.29e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4851.24 5.670e-04 0.000e+00 7.915e-08 0.000e+00 8.725e-03 4.60e+00 6.98e-01 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 595936.6 % faster, avg. sp. ratio 5960.366x, max sp. ratio 6024.390x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 58432.9/57250.0/59615.9/116865.9 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.8/ 9.7/ 9.9/ 19.6 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.8, min. 9.7, max. 9.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 774900.0 % faster, avg. sp. ratio 7750.000x, max sp. ratio 8337.349x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 110488.0/110228.9/110747.0/220975.9 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.3/ 13.3/ 15.4/ 28.7 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.3, min. 13.3, max. 15.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.506/ 1.586/ 3.427,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.547/ 1.893/ 4.655,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.476/ 1.567/ 3.386,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.468/ 1.870/ 4.599,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 0.995/ 0.698/ 1.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.069e+03, min 1.228e+03, max 4.910e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.183e-01, min 2.038e-01, max 8.328e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 1.564e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 4.661e-04s, min 4.611e-04s, max 4.711e-04s, tot 9.322e-04s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.368e+01 2.957e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.032e+03, min 1.213e+03, max 4.851e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 4.114e-01, min 1.455e-01, max 6.773e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 7.915e-08s, min 7.915e-08s, max 7.915e-08s, tot 1.583e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.135e-04s, min 5.670e-04s, max 6.599e-04s, tot 1.227e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.391e+01 3.006e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type Z: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1227.60 5.400e-04 0.000e+00 7.820e-08 0.000e+00 4.870e-03 3.43e+00 2.29e+00 1 9.60e-05 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.208e-04 0.000e+00 7.820e-08 0.000e+00 4.420e-03 8.95e+00 1.32e+00 1 3.84e-04 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1212.81 5.760e-04 0.000e+00 7.915e-08 0.000e+00 1.174e-02 3.39e+00 2.29e+00 1 9.60e-05 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4851.24 6.299e-04 0.000e+00 7.915e-08 0.000e+00 9.607e-03 8.84e+00 1.32e+00 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 614229.3 % faster, avg. sp. ratio 6143.293x, max sp. ratio 6905.488x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 59397.9/56521.3/62274.4/118795.7 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 9.8/ 9.0/ 10.5/ 19.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 9.8, min. 9.0, max. 10.5 ops) +#pr: (in succ. cases rsb autotuning gave avg. 761647.0 % faster, avg. sp. ratio 7617.470x, max sp. ratio 7957.831x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 134861.4/121370.5/148352.4/269722.9 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 17.8/ 15.3/ 20.4/ 35.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 17.8, min. 15.3, max. 20.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.655/ 2.813/ 6.496,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.378/ 3.427/ 8.951,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.599/ 2.779/ 6.418,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.229/ 3.386/ 8.843,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.807/ 1.323/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.01 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.01 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.069e+03, min 1.228e+03, max 4.910e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.452e-01, min 1.778e-01, max 9.125e-01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 1.564e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 4.804e-04s, min 4.208e-04s, max 5.400e-04s, tot 9.608e-04s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.218e+00 1.667e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.01 s, tot 0.02 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.032e+03, min 1.213e+03, max 4.851e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.881e-01, min 1.667e-01, max 6.096e-01 (2 samples) +#pr: best tun. rsb operation time was: on avg. 7.915e-08s, min 7.915e-08s, max 7.915e-08s, tot 1.583e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 6.030e-04s, min 5.760e-04s, max 6.299e-04s, tot 1.206e-03s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.338e+00 1.694e+01 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 306.90 5.221e-04 0.000e+00 7.820e-08 0.000e+00 4.720e-03 1.89e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 306.90 4.139e-04 0.000e+00 7.820e-08 0.000e+00 6.863e-03 1.13e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1227.60 4.711e-04 0.000e+00 7.820e-08 0.000e+00 4.662e-03 1.89e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1227.60 5.400e-04 0.000e+00 7.820e-08 0.000e+00 4.870e-03 3.43e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 25.17 1.313e-03 0.000e+00 9.537e-07 0.000e+00 1.618e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 303.20 9.429e-04 0.000e+00 7.915e-08 0.000e+00 9.039e-03 1.11e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1212.81 6.599e-04 0.000e+00 7.915e-08 0.000e+00 8.766e-03 1.87e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1212.81 5.760e-04 0.000e+00 7.915e-08 0.000e+00 1.174e-02 3.39e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 622384.8 % faster, avg. sp. ratio 6224.848x, max sp. ratio 6905.488x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 67501.5/59615.9/87759.1/270006.1 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.1/ 9.0/ 16.6/ 44.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 11.1, min. 9.0, max. 16.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 722496.5 % faster, avg. sp. ratio 7225.965x, max sp. ratio 11912.651x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 97565.0/16968.0/148352.4/390260.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.9/ 9.6/ 20.4/ 55.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.9, min. 9.6, max. 20.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.739/ 0.972/ 2.813,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 8.337/ 1.125/ 3.427,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.359/ 0.130/ 2.779,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.522/ 0.155/ 3.386,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.673e+02, min 3.069e+02, max 1.228e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.214e-01, min 4.596e-02, max 2.038e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 3.128e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 4.868e-04s, min 4.139e-04s, max 5.400e-04s, tot 1.947e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.667e+01 4.825e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 6.885e+02, min 2.517e+01, max 1.213e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.896e-02, min 1.828e-02, max 1.667e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 2.978e-07s, min 7.915e-08s, max 9.537e-07s, tot 1.191e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.730e-04s, min 5.760e-04s, max 1.313e-03s, tot 3.492e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.694e+01 3.622e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: ======== Limiting to nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1227.60 8.330e-04 0.000e+00 7.820e-08 0.000e+00 8.379e-03 4.65e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1227.60 6.661e-04 0.000e+00 7.820e-08 0.000e+00 7.349e-03 2.51e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.611e-04 0.000e+00 7.820e-08 0.000e+00 4.477e-03 4.65e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.208e-04 0.000e+00 7.820e-08 0.000e+00 4.420e-03 8.95e+00 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 100.66 1.098e-03 0.000e+00 9.537e-07 0.000e+00 2.464e-02 3.82e-01 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1212.81 8.552e-04 0.000e+00 7.915e-08 0.000e+00 8.359e-03 2.48e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4851.24 5.670e-04 0.000e+00 7.915e-08 0.000e+00 8.725e-03 4.60e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4851.24 6.299e-04 0.000e+00 7.915e-08 0.000e+00 9.607e-03 8.84e+00 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 761104.3 % faster, avg. sp. ratio 7612.043x, max sp. ratio 10652.439x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 78723.3/56521.3/107146.3/314893.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.3/ 9.7/ 11.0/ 41.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.3, min. 9.7, max. 11.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 676798.7 % faster, avg. sp. ratio 6768.987x, max sp. ratio 10804.217x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 90760.5/25840.2/121370.5/363042.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.7/ 9.8/ 22.4/ 62.9 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.7, min. 9.8, max. 22.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.811/ 1.893/ 6.496,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 20.767/ 2.506/ 8.951,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.989/ 0.281/ 6.418,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.300/ 0.382/ 8.843,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.069e+03, min 1.228e+03, max 4.910e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.012e-01, min 1.152e-01, max 9.125e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 3.128e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.953e-04s, min 4.208e-04s, max 8.330e-04s, tot 2.381e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.218e+00 2.478e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.754e+03, min 1.007e+02, max 4.851e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.717e-01, min 8.744e-02, max 6.773e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 2.978e-07s, min 7.915e-08s, max 9.537e-07s, tot 1.191e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 7.875e-04s, min 5.670e-04s, max 1.098e-03s, tot 3.150e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.338e+00 1.676e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 306.90 5.221e-04 0.000e+00 7.820e-08 0.000e+00 4.720e-03 1.89e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 306.90 4.139e-04 0.000e+00 7.820e-08 0.000e+00 6.863e-03 1.13e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1227.60 4.711e-04 0.000e+00 7.820e-08 0.000e+00 4.662e-03 1.89e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1227.60 5.400e-04 0.000e+00 7.820e-08 0.000e+00 4.870e-03 3.43e+00 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1227.60 8.330e-04 0.000e+00 7.820e-08 0.000e+00 8.379e-03 4.65e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1227.60 6.661e-04 0.000e+00 7.820e-08 0.000e+00 7.349e-03 2.51e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.611e-04 0.000e+00 7.820e-08 0.000e+00 4.477e-03 4.65e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.208e-04 0.000e+00 7.820e-08 0.000e+00 4.420e-03 8.95e+00 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 25.17 1.313e-03 0.000e+00 9.537e-07 0.000e+00 1.618e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 303.20 9.429e-04 0.000e+00 7.915e-08 0.000e+00 9.039e-03 1.11e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1212.81 6.599e-04 0.000e+00 7.915e-08 0.000e+00 8.766e-03 1.87e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1212.81 5.760e-04 0.000e+00 7.915e-08 0.000e+00 1.174e-02 3.39e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 100.66 1.098e-03 0.000e+00 9.537e-07 0.000e+00 2.464e-02 3.82e-01 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1212.81 8.552e-04 0.000e+00 7.915e-08 0.000e+00 8.359e-03 2.48e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4851.24 5.670e-04 0.000e+00 7.915e-08 0.000e+00 8.725e-03 4.60e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4851.24 6.299e-04 0.000e+00 7.915e-08 0.000e+00 9.607e-03 8.84e+00 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 691744.5 % faster, avg. sp. ratio 6918.445x, max sp. ratio 10652.439x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 73112.4/56521.3/107146.3/584899.4 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.7/ 9.0/ 16.6/ 85.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.7, min. 9.0, max. 16.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 699647.6 % faster, avg. sp. ratio 6997.476x, max sp. ratio 11912.651x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 94162.8/16968.0/148352.4/753302.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.8/ 9.6/ 22.4/118.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.8, min. 9.6, max. 22.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.775/ 0.972/ 6.496,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.104/ 1.125/ 8.951,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.174/ 0.130/ 6.418,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 22.822/ 0.155/ 8.843,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /8 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.05 s (8 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.05 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.918e+03, min 3.069e+02, max 4.910e+03 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.113e-01, min 4.596e-02, max 9.125e-01 (8 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 6.256e-07s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.410e-04s, min 4.139e-04s, max 8.330e-04s, tot 4.328e-03s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.218e+00 4.825e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.10 s (8 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.10 s (8 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.721e+03, min 2.517e+01, max 4.851e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.303e-01, min 1.828e-02, max 6.773e-01 (8 samples) +#pr: best tun. rsb operation time was: on avg. 2.978e-07s, min 7.915e-08s, max 9.537e-07s, tot 2.382e-06s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.302e-04s, min 5.670e-04s, max 1.313e-03s, tot 6.642e-03s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.338e+00 3.622e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 306.90 5.221e-04 0.000e+00 7.820e-08 0.000e+00 4.720e-03 1.89e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 306.90 4.139e-04 0.000e+00 7.820e-08 0.000e+00 6.863e-03 1.13e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1227.60 4.711e-04 0.000e+00 7.820e-08 0.000e+00 4.662e-03 1.89e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1227.60 5.400e-04 0.000e+00 7.820e-08 0.000e+00 4.870e-03 3.43e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 25.17 1.313e-03 0.000e+00 9.537e-07 0.000e+00 1.618e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 303.20 9.429e-04 0.000e+00 7.915e-08 0.000e+00 9.039e-03 1.11e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1212.81 6.599e-04 0.000e+00 7.915e-08 0.000e+00 8.766e-03 1.87e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1212.81 5.760e-04 0.000e+00 7.915e-08 0.000e+00 1.174e-02 3.39e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 622384.8 % faster, avg. sp. ratio 6224.848x, max sp. ratio 6905.488x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 67501.5/59615.9/87759.1/270006.1 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 11.1/ 9.0/ 16.6/ 44.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 11.1, min. 9.0, max. 16.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 722496.5 % faster, avg. sp. ratio 7225.965x, max sp. ratio 11912.651x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 97565.0/16968.0/148352.4/390260.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.9/ 9.6/ 20.4/ 55.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.9, min. 9.6, max. 20.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.739/ 0.972/ 2.813,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 8.337/ 1.125/ 3.427,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 1.359/ 0.130/ 2.779,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 6.522/ 0.155/ 3.386,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 7.673e+02, min 3.069e+02, max 1.228e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.214e-01, min 4.596e-02, max 2.038e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 3.128e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 4.868e-04s, min 4.139e-04s, max 5.400e-04s, tot 1.947e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.667e+01 4.825e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 6.885e+02, min 2.517e+01, max 1.213e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 8.896e-02, min 1.828e-02, max 1.667e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 2.978e-07s, min 7.915e-08s, max 9.537e-07s, tot 1.191e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.730e-04s, min 5.760e-04s, max 1.313e-03s, tot 3.492e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.694e+01 3.622e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: ======== Limiting to both transA=N and nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1227.60 8.330e-04 0.000e+00 7.820e-08 0.000e+00 8.379e-03 4.65e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1227.60 6.661e-04 0.000e+00 7.820e-08 0.000e+00 7.349e-03 2.51e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.611e-04 0.000e+00 7.820e-08 0.000e+00 4.477e-03 4.65e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.208e-04 0.000e+00 7.820e-08 0.000e+00 4.420e-03 8.95e+00 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 100.66 1.098e-03 0.000e+00 9.537e-07 0.000e+00 2.464e-02 3.82e-01 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1212.81 8.552e-04 0.000e+00 7.915e-08 0.000e+00 8.359e-03 2.48e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4851.24 5.670e-04 0.000e+00 7.915e-08 0.000e+00 8.725e-03 4.60e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4851.24 6.299e-04 0.000e+00 7.915e-08 0.000e+00 9.607e-03 8.84e+00 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 761104.3 % faster, avg. sp. ratio 7612.043x, max sp. ratio 10652.439x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 78723.3/56521.3/107146.3/314893.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.3/ 9.7/ 11.0/ 41.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.3, min. 9.7, max. 11.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 676798.7 % faster, avg. sp. ratio 6768.987x, max sp. ratio 10804.217x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 90760.5/25840.2/121370.5/363042.1 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.7/ 9.8/ 22.4/ 62.9 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.7, min. 9.8, max. 22.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.811/ 1.893/ 6.496,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 20.767/ 2.506/ 8.951,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.989/ 0.281/ 6.418,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 16.300/ 0.382/ 8.843,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.069e+03, min 1.228e+03, max 4.910e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 5.012e-01, min 1.152e-01, max 9.125e-01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 3.128e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.953e-04s, min 4.208e-04s, max 8.330e-04s, tot 2.381e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.218e+00 2.478e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.05 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.754e+03, min 1.007e+02, max 4.851e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.717e-01, min 8.744e-02, max 6.773e-01 (4 samples) +#pr: best tun. rsb operation time was: on avg. 2.978e-07s, min 7.915e-08s, max 9.537e-07s, tot 1.191e-06s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 7.875e-04s, min 5.670e-04s, max 1.098e-03s, tot 3.150e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.338e+00 1.676e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 8) matched the dump criteria -- skipping dump round. @@ -5048,49 +5084,49 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 306.90 5.221e-04 0.000e+00 7.820e-08 0.000e+00 4.720e-03 1.89e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 306.90 4.139e-04 0.000e+00 7.820e-08 0.000e+00 6.863e-03 1.13e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1227.60 4.711e-04 0.000e+00 7.820e-08 0.000e+00 4.662e-03 1.89e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1227.60 5.400e-04 0.000e+00 7.820e-08 0.000e+00 4.870e-03 3.43e+00 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 1227.60 8.330e-04 0.000e+00 7.820e-08 0.000e+00 8.379e-03 4.65e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1227.60 6.661e-04 0.000e+00 7.820e-08 0.000e+00 7.349e-03 2.51e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.611e-04 0.000e+00 7.820e-08 0.000e+00 4.477e-03 4.65e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4910.40 4.208e-04 0.000e+00 7.820e-08 0.000e+00 4.420e-03 8.95e+00 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 12 12 0 4.0000 4.6667 3 1 25.17 1.313e-03 0.000e+00 9.537e-07 0.000e+00 1.618e-02 1.55e-01 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 12 12 0 4.0000 4.6667 3 1 303.20 9.429e-04 0.000e+00 7.915e-08 0.000e+00 9.039e-03 1.11e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 12 12 0 4.0000 4.6667 3 1 1212.81 6.599e-04 0.000e+00 7.915e-08 0.000e+00 8.766e-03 1.87e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 12 12 0 4.0000 4.6667 3 1 1212.81 5.760e-04 0.000e+00 7.915e-08 0.000e+00 1.174e-02 3.39e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 12 12 0 4.0000 4.6667 3 1 100.66 1.098e-03 0.000e+00 9.537e-07 0.000e+00 2.464e-02 3.82e-01 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 12 12 0 4.0000 4.6667 3 1 1212.81 8.552e-04 0.000e+00 7.915e-08 0.000e+00 8.359e-03 2.48e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 12 12 0 4.0000 4.6667 3 1 4851.24 5.670e-04 0.000e+00 7.915e-08 0.000e+00 8.725e-03 4.60e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 12 12 0 4.0000 4.6667 3 1 4851.24 6.299e-04 0.000e+00 7.915e-08 0.000e+00 9.607e-03 8.84e+00 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 691744.5 % faster, avg. sp. ratio 6918.445x, max sp. ratio 10652.439x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 73112.4/56521.3/107146.3/584899.4 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 10.7/ 9.0/ 16.6/ 85.8 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 10.7, min. 9.0, max. 16.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 699647.6 % faster, avg. sp. ratio 6997.476x, max sp. ratio 11912.651x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 94162.8/16968.0/148352.4/753302.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.8/ 9.6/ 22.4/118.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.8, min. 9.6, max. 22.5 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.775/ 0.972/ 6.496,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.104/ 1.125/ 8.951,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.174/ 0.130/ 6.418,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 22.822/ 0.155/ 8.843,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /8 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.05 s (8 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.00 s, max 0.01 s, tot 0.05 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.918e+03, min 3.069e+02, max 4.910e+03 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 3.113e-01, min 4.596e-02, max 9.125e-01 (8 samples) -#pr: best tun. rsb operation time was: on avg. 7.820e-08s, min 7.820e-08s, max 7.820e-08s, tot 6.256e-07s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.410e-04s, min 4.139e-04s, max 8.330e-04s, tot 4.328e-03s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.218e+00 4.825e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.018e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.10 s (8 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.01 s, min 0.01 s, max 0.02 s, tot 0.10 s (8 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.721e+03, min 2.517e+01, max 4.851e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.303e-01, min 1.828e-02, max 6.773e-01 (8 samples) +#pr: best tun. rsb operation time was: on avg. 2.978e-07s, min 7.915e-08s, max 9.537e-07s, tot 2.382e-06s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 8.302e-04s, min 5.670e-04s, max 1.313e-03s, tot 6.642e-03s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 7.338e+00 3.622e+02 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.013e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) -#pr: Record collection took 0.33 s. +#pr: Record collection took 0.56 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 100 environment variables in 5413 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 100 environment variables in 5467 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1773327832_gcc-14.2.rpr -# Removing the temporary record file rsbench_pr__1773327832_gcc-14.2.rpr.tmp. -# terminating run at 1773327838 (after 5.7s of w.c.t.) -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash ./scripts/doc-tests.sh +#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1738918486_gcc-14.2.rpr +# Removing the temporary record file rsbench_pr__1738918486_gcc-14.2.rpr.tmp. +# terminating run at 1738918492 (after 5.9s of w.c.t.) +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh ./scripts/doc-tests.sh + set -o pipefail + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x + cat /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/autotune.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/io-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/power.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/snippets.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/transpose.c @@ -5108,8 +5144,8 @@ ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h ++ wc -l + test 182 -ge 157 -++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h ++ wc -c +++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h + test 5369 -ge 4600 + exit 0 if ! ./librsb-config --help ; then echo "Problem executing the librsb-config script!"; false; fi; @@ -5144,7 +5180,7 @@ type char codes:D S C Z gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' if test /build/reproducible-path/librsb-1.3.0.2+dfsg != /build/reproducible-path/librsb-1.3.0.2+dfsg ; then cp /build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/vf.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/examples ; fi -( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) +( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) + which rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench + BRF=test.rpr @@ -5154,15 +5190,15 @@ Will invoke autotuning for ~10.000000 s x 1 rounds, specifying verbosity=0 and threads=0. (>0 means no structure tuning; 0 means only structure tuning, <0 means tuning of both with (negated) thread count suggestion). # Requested no transposition. # performance record file set to: test.rpr -# beginning run at 1773327838 +# beginning run at 1738918492 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench --lower 100 --as-symmetric --types : -n 1 --notranspose --compare-competitors --verbose --verbose --write-performance-record=test.rpr # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -fstack-clash-protection -Wformat -Werror=format-security -mbranch-protection=standard -O3 -std=c99 -# average timer granularity: 7.57e-08 s +# average timer granularity: 4.92e-08 s # Will write a final performance record to file test.rpr and periodic checkpoints to test.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -5201,7 +5237,7 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: codethink03-arm64 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 2 (each --verbose occurrence counts +1) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 43690 bytes @@ -5221,29 +5257,29 @@ # This test will measure times in scanning arrays sized and aligned to fit in caches. # 2 cache levels detected Will fill struct with 40 samples... -# Memory benchmark took 5.369s +# Memory benchmark took 5.325s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 4 samples (1120 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 524288 bytes, per-thread 43690 bytes -# so far, program took 5.373s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 5.328s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 7.185e-03 s (100.00 %) - analyzed arrays in 2.067e-03 s (28.77 %) - cleaned-up arrays in 1.001e-05 s (0.14 %) - deduplicated arrays in 9.060e-06 s (0.13 %) + converted COO to RSB in 3.504e-02 s (100.00 %) + analyzed arrays in 1.617e-02 s (46.16 %) + cleaned-up arrays in 1.001e-05 s (0.03 %) + deduplicated arrays in 9.060e-06 s (0.03 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.839e-03 s (53.43 %) - memory allocations took 1.383e-05 s (0.19 %) - leafs setup took 5.007e-06 s (0.07 %) - halfword conversion took 1.238e-03 s (17.23 %) -Built (100 x 100)[0xaaaad0340930]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.007s): (100 x 100)[0xaaaad0340930]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 1.442e-02 s (41.16 %) + memory allocations took 1.383e-05 s (0.04 %) + leafs setup took 6.914e-06 s (0.02 %) + halfword conversion took 4.401e-03 s (12.56 %) +Built (100 x 100)[0xaaaaeaaa3970]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.035s): (100 x 100)[0xaaaaeaaa3970]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -5294,10 +5330,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002496s; avg 0.000832s ( +/- 25.35/ 50.01 %); best 0.0006211s; worst 0.001248s; std dev. 0.0002943 (taking best). -Reference operation time is 0.00062108 s (32.52 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0006211 Mflops: 32.524) -Merge (3 -> 1 leaves) took w.c.t. of 4.101e-05s, ~3.29e-05s of computing time (of which 1.502e-05s sorting, 3.099e-06s analysis) +3 iterations (1 th.) took 0.006517s; avg 0.002172s ( +/- 46.69/ 87.08 %); best 0.001158s; worst 0.004064s; std dev. 0.001339 (taking best). +Reference operation time is 0.001158 s (17.44 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.001158 Mflops: 17.444) +Merge (3 -> 1 leaves) took w.c.t. of 0.0001061s, ~8.512e-05s of computing time (of which 3.505e-05s sorting, 7.153e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5328,8 +5364,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 1.788e-05s; avg 5.96e-06s ( +/- 0.00/ 0.00 %); best 5.96e-06s; worst 5.96e-06s; std dev. 0 (taking best). -Reference operation time is 5.96046e-06 s (3389 Mflops) with 1 threads. +3 iterations (1 th.) took 5.603e-05s; avg 1.868e-05s ( +/- 13.19/ 17.45 %); best 1.621e-05s; worst 2.193e-05s; std dev. 2.403e-06 (taking best). +Reference operation time is 1.62125e-05 s (1246 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5345,16 +5381,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 5.96e-06 s ~Mflops: 3388.998 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 104.200x: 0.0006211s -> 5.96e-06s, so taking this instance. +After merge step 1: tpop: 1.621e-05 s ~Mflops: 1245.955 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 71.426x: 0.001158s -> 1.621e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.009197s (of which 4.387e-05s partitioning, 0.00622s I/O); computing times: 3.29e-05s in par. loops, 1.502e-05s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.009197s, equivalent to 1543.0/14.8 new/old ops (0.005144s for 2 clones -- as 863.0/8.3 ops, or 431.5/4.1 ops per clone), SPEEDUP of 104.200x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 104.200x (0.0006211s -> 5.96e-06s), will amortize in 15.0 ops by saving 0.0006151s per op. -In 1 tuning rounds (tot. 0.014s, 0.0051s for constructor, 2 clones) obtained a SPEEDUP of 10320.0% (104.2x) (from 32.52 to 3389 Mflops). Employed 0.0073s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01603s (of which 0.000113s partitioning, 0.01164s I/O); computing times: 8.512e-05s in par. loops, 3.505e-05s sorting, 7.153e-06s analyzing) +Total merge + benchmarking process took 0.01603s, equivalent to 988.8/13.8 new/old ops (0.00871s for 2 clones -- as 537.2/7.5 ops, or 268.6/3.8 ops per clone), SPEEDUP of 71.426x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 71.426x (0.001158s -> 1.621e-05s), will amortize in 14.0 ops by saving 0.001142s per op. +In 1 tuning rounds (tot. 0.028s, 0.0087s for constructor, 2 clones) obtained a SPEEDUP of 7042.6% (71.43x) (from 17.44 to 1246 Mflops). Employed 0.014s for I/O of matrix plots. #pr: updating sample at index 1 (0^th of 4), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.0213089 s (6.211e-04 s -> 5.960e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0415349 s (1.158e-03 s -> 1.621e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -5420,20 +5456,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 2.217e-05s; avg 7.391e-06s ( +/- 19.35/ 35.48 %); best 5.96e-06s; worst 1.001e-05s; std dev. 1.857e-06 (taking best). -Reference operation time is 5.96046e-06 s (3389 Mflops) with 1 threads. +3 iterations (1 th.) took 5.198e-05s; avg 1.733e-05s ( +/- 13.30/ 26.61 %); best 1.502e-05s; worst 2.193e-05s; std dev. 3.259e-06 (taking best). +Reference operation time is 1.50204e-05 s (1345 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.882e-03 s (100.00 %) - analyzed arrays in 1.023e-03 s (35.50 %) - cleaned-up arrays in 9.060e-06 s (0.31 %) - deduplicated arrays in 6.914e-06 s (0.24 %) + converted COO to RSB in 4.010e-03 s (100.00 %) + analyzed arrays in 1.358e-03 s (33.86 %) + cleaned-up arrays in 2.384e-05 s (0.59 %) + deduplicated arrays in 2.003e-05 s (0.50 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.838e-03 s (63.77 %) - memory allocations took 1.907e-06 s (0.07 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 2.146e-06 s (0.07 %) -Built (100 x 100)[0xaaaad034b120]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 2.594e-03 s (64.68 %) + memory allocations took 5.484e-06 s (0.14 %) + leafs setup took 1.907e-06 s (0.05 %) + halfword conversion took 7.153e-06 s (0.18 %) +Built (100 x 100)[0xaaaaeaaae160]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5467,16 +5503,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.721e-03 s (100.00 %) - analyzed arrays in 1.441e-03 s (30.52 %) - cleaned-up arrays in 9.060e-06 s (0.19 %) - deduplicated arrays in 6.914e-06 s (0.15 %) + converted COO to RSB in 7.050e-03 s (100.00 %) + analyzed arrays in 1.877e-03 s (26.62 %) + cleaned-up arrays in 9.060e-06 s (0.13 %) + deduplicated arrays in 2.098e-05 s (0.30 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.429e-03 s (30.27 %) - memory allocations took 9.537e-07 s (0.02 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 1.834e-03 s (38.85 %) -Built (100 x 100)[0xaaaad0340c60]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + shuffled partitions in 2.554e-03 s (36.23 %) + memory allocations took 4.053e-06 s (0.06 %) + leafs setup took 4.053e-06 s (0.06 %) + halfword conversion took 2.581e-03 s (36.61 %) +Built (100 x 100)[0xaaaaeaaa3ca0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5522,9 +5558,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002481s; avg 0.000827s ( +/- 25.01/ 48.85 %); best 0.0006201s; worst 0.001231s; std dev. 0.0002857 (taking best). -Reference operation time is 0.000620127 s (32.57 Mflops) with 1 threads. -Challenging best inner round reference (5.96046e-06 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000620127 s/0 threads (speedup 0.00961169 x), same?n. +3 iterations (1 th.) took 0.003457s; avg 0.001152s ( +/- 7.06/ 5.43 %); best 0.001071s; worst 0.001215s; std dev. 6.027e-05 (taking best). +Reference operation time is 0.00107098 s (18.86 Mflops) with 1 threads. +Challenging best inner round reference (1.50204e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.00107098 s/0 threads (speedup 0.0140249 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5558,16 +5594,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 5.404e-03 s (100.00 %) - analyzed arrays in 1.660e-03 s (30.72 %) - cleaned-up arrays in 9.060e-06 s (0.17 %) - deduplicated arrays in 6.914e-06 s (0.13 %) + converted COO to RSB in 8.006e-03 s (100.00 %) + analyzed arrays in 2.689e-03 s (33.59 %) + cleaned-up arrays in 2.313e-05 s (0.29 %) + deduplicated arrays in 2.003e-05 s (0.25 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.883e-03 s (34.85 %) - memory allocations took 1.907e-06 s (0.04 %) - leafs setup took 9.537e-07 s (0.02 %) - halfword conversion took 1.841e-03 s (34.07 %) -Built (100 x 100)[0xaaaad0341650]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 2.996e-03 s (37.42 %) + memory allocations took 5.722e-06 s (0.07 %) + leafs setup took 4.053e-06 s (0.05 %) + halfword conversion took 2.266e-03 s (28.30 %) +Built (100 x 100)[0xaaaaeaaa4690]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5613,9 +5649,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002486s; avg 0.0008287s ( +/- 24.82/ 48.69 %); best 0.000623s; worst 0.001232s; std dev. 0.0002853 (taking best). -Reference operation time is 0.000622988 s (32.42 Mflops) with 1 threads. -Challenging best inner round reference (5.96046e-06 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000622988 s/0 threads (speedup 0.00956755 x), same?n. +3 iterations (1 th.) took 0.003364s; avg 0.001121s ( +/- 19.74/ 10.22 %); best 0.0009s; worst 0.001236s; std dev. 0.0001565 (taking best). +Reference operation time is 0.00090003 s (22.44 Mflops) with 1 threads. +Challenging best inner round reference (1.50204e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.00090003 s/0 threads (speedup 0.0166887 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5649,16 +5685,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.631e-03 s (100.00 %) - analyzed arrays in 2.096e-03 s (45.26 %) - cleaned-up arrays in 9.060e-06 s (0.20 %) - deduplicated arrays in 6.914e-06 s (0.15 %) + converted COO to RSB in 1.062e-02 s (100.00 %) + analyzed arrays in 4.406e-03 s (41.50 %) + cleaned-up arrays in 9.060e-06 s (0.09 %) + deduplicated arrays in 7.868e-06 s (0.07 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.473e-03 s (31.81 %) - memory allocations took 3.099e-06 s (0.07 %) - leafs setup took 9.537e-07 s (0.02 %) - halfword conversion took 1.042e-03 s (22.50 %) -Built (100 x 100)[0xaaaad034b240]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 24, symflags:'LS' + shuffled partitions in 2.708e-03 s (25.50 %) + memory allocations took 7.153e-06 s (0.07 %) + leafs setup took 5.007e-06 s (0.05 %) + halfword conversion took 3.473e-03 s (32.71 %) +Built (100 x 100)[0xaaaaeaaae280]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5704,10 +5740,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001626s; avg 0.000542s ( +/- 3.71/ 3.33 %); best 0.0005219s; worst 0.00056s; std dev. 1.564e-05 (taking best). -Reference operation time is 0.000521898 s (38.7 Mflops) with 1 threads. -Challenging best inner round reference (5.96046e-06 s/1 threads) with: subdivision 1, 24 leaves, 2.295 bytes/nz, 0.000521898 s/0 threads (speedup 0.0114207 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 34 subms, 24 lsubms, 2.2947 bpnz +3 iterations (1 th.) took 0.003307s; avg 0.001102s ( +/- 5.38/ 4.33 %); best 0.001043s; worst 0.00115s; std dev. 4.446e-05 (taking best). +Reference operation time is 0.00104308 s (19.37 Mflops) with 1 threads. +Challenging best inner round reference (1.50204e-05 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.00104308 s/0 threads (speedup 0.0144 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 34 subms, 25 lsubms, 2.3168 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5740,16 +5776,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.789e-03 s (100.00 %) - analyzed arrays in 1.554e-03 s (41.01 %) - cleaned-up arrays in 8.106e-06 s (0.21 %) - deduplicated arrays in 7.868e-06 s (0.21 %) + converted COO to RSB in 6.731e-03 s (100.00 %) + analyzed arrays in 2.704e-03 s (40.17 %) + cleaned-up arrays in 2.599e-05 s (0.39 %) + deduplicated arrays in 2.289e-05 s (0.34 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.127e-03 s (29.74 %) - memory allocations took 2.861e-06 s (0.08 %) - leafs setup took 1.192e-06 s (0.03 %) - halfword conversion took 1.088e-03 s (28.71 %) -Built (100 x 100)[0xaaaad0371ee0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.830e-03 s (27.19 %) + memory allocations took 5.960e-06 s (0.09 %) + leafs setup took 5.960e-06 s (0.09 %) + halfword conversion took 2.135e-03 s (31.72 %) +Built (100 x 100)[0xaaaaeaad4f20]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5795,9 +5831,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.00154s; avg 0.0005133s ( +/- 5.71/ 6.55 %); best 0.000484s; worst 0.0005469s; std dev. 2.587e-05 (taking best). -Reference operation time is 0.00048399 s (41.74 Mflops) with 1 threads. -Challenging best inner round reference (5.96046e-06 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.00048399 s/0 threads (speedup 0.0123153 x), same?n. +3 iterations (1 th.) took 0.002953s; avg 0.0009844s ( +/- 26.56/ 17.13 %); best 0.0007229s; worst 0.001153s; std dev. 0.0001875 (taking best). +Reference operation time is 0.000722885 s (27.94 Mflops) with 1 threads. +Challenging best inner round reference (1.50204e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000722885 s/0 threads (speedup 0.0207784 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -5831,16 +5867,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.518e-03 s (100.00 %) - analyzed arrays in 1.460e-03 s (41.50 %) - cleaned-up arrays in 8.821e-06 s (0.25 %) - deduplicated arrays in 8.106e-06 s (0.23 %) + converted COO to RSB in 8.276e-03 s (100.00 %) + analyzed arrays in 2.542e-03 s (30.72 %) + cleaned-up arrays in 9.775e-06 s (0.12 %) + deduplicated arrays in 9.060e-06 s (0.11 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.035e-03 s (29.42 %) - memory allocations took 3.099e-06 s (0.09 %) - leafs setup took 1.907e-06 s (0.05 %) - halfword conversion took 1.001e-03 s (28.46 %) -Built (100 x 100)[0xaaaad0371ee0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 2.287e-03 s (27.63 %) + memory allocations took 6.914e-06 s (0.08 %) + leafs setup took 8.106e-06 s (0.10 %) + halfword conversion took 3.412e-03 s (41.23 %) +Built (100 x 100)[0xaaaaeaad4f20]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5886,11 +5922,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.00148s; avg 0.0004933s ( +/- 5.75/ 3.77 %); best 0.0004649s; worst 0.0005119s; std dev. 2.038e-05 (taking best). -Reference operation time is 0.000464916 s (43.45 Mflops) with 1 threads. -Challenging best inner round reference (5.96046e-06 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000464916 s/0 threads (speedup 0.0128205 x), same?n. +3 iterations (1 th.) took 0.004802s; avg 0.001601s ( +/- 30.90/ 19.52 %); best 0.001106s; worst 0.001913s; std dev. 0.0003538 (taking best). +Reference operation time is 0.00110602 s (18.26 Mflops) with 1 threads. +Challenging best inner round reference (1.50204e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.00110602 s/0 threads (speedup 0.0135805 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 3389 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 1344.84 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5906,23 +5942,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0355 s (eq. to 6e+03/ 6e+03 old/new op.times), gained local/global speedup 1 x (5.96046e-06 : 5.96046e-06) / 1 x (5.96046e-06 : 5.96046e-06). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.063997 s (eq. to 4e+03/ 4e+03 old/new op.times), gained local/global speedup 1 x (1.50204e-05 : 1.50204e-05) / 1 x (1.50204e-05 : 1.50204e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.036s, 0.026s for constructor, 0 clones) obtained NO speedup (best stays 3389 Mflops). -Second run of RSB Autotuner took 0.0355201 s and estimated a speedup of 1.000000 x (5.960e-06 s -> 5.960e-06 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.064s, 0.046s for constructor, 0 clones) obtained NO speedup (best stays 1345 Mflops). +Second run of RSB Autotuner took 0.0640378 s and estimated a speedup of 1.000000 x (1.502e-05 s -> 1.502e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:100 #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.002067 0.003839 0.005906 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005906 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002067 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003839 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.016172 0.014422 0.030594 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.030594 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.016172 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.014422 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005906 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.030594 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -5937,34 +5973,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00718498 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.035037 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00206685 0 0.00383902 -# so far, program took 5.440s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.057s/0.000s . +%constructor:lower-100x100-5050nz 0 0.0161722 0 0.0144222 +# so far, program took 5.476s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.106s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.04363s (system CPU time used) -ru_utime : 5.98s (user CPU time used) +ru_stime : 0.0563s (system CPU time used) +ru_utime : 5.999s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.440s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.057s/0.000s . +# so far, program took 5.476s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.106s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.393e-03 s (100.00 %) - analyzed arrays in 5.422e-04 s (15.98 %) - cleaned-up arrays in 9.060e-06 s (0.27 %) - deduplicated arrays in 7.868e-06 s (0.23 %) + converted COO to RSB in 7.047e-03 s (100.00 %) + analyzed arrays in 1.319e-03 s (18.72 %) + cleaned-up arrays in 2.003e-05 s (0.28 %) + deduplicated arrays in 1.717e-05 s (0.24 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.893e-03 s (55.79 %) - memory allocations took 2.861e-06 s (0.08 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 9.379e-04 s (27.64 %) -Built (100 x 100)[0xaaaad034b240]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.003s): (100 x 100)[0xaaaad034b240]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 3.931e-03 s (55.78 %) + memory allocations took 5.960e-06 s (0.08 %) + leafs setup took 2.146e-06 s (0.03 %) + halfword conversion took 1.751e-03 s (24.85 %) +Built (100 x 100)[0xaaaaeaaae280]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.007s): (100 x 100)[0xaaaaeaaae280]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -6015,10 +6051,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001352s; avg 0.0004507s ( +/- 0.81/ 0.72 %); best 0.000447s; worst 0.0004539s; std dev. 2.837e-06 (taking best). -Reference operation time is 0.000447035 s (45.19 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.000447 Mflops: 45.187) -Merge (3 -> 1 leaves) took w.c.t. of 3.6e-05s, ~3.099e-05s of computing time (of which 1.287e-05s sorting, 9.537e-07s analysis) +3 iterations (1 th.) took 0.006549s; avg 0.002183s ( +/- 40.72/ 74.90 %); best 0.001294s; worst 0.003818s; std dev. 0.001158 (taking best). +Reference operation time is 0.00129414 s (15.61 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.001294 Mflops: 15.609) +Merge (3 -> 1 leaves) took w.c.t. of 6.7e-05s, ~5.507e-05s of computing time (of which 2.098e-05s sorting, 4.053e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6049,8 +6085,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 1.788e-05s; avg 5.96e-06s ( +/- 16.00/ 16.00 %); best 5.007e-06s; worst 6.914e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 5.00679e-06 s (4035 Mflops) with 1 threads. +3 iterations (1 th.) took 3.815e-05s; avg 1.272e-05s ( +/- 6.25/ 10.62 %); best 1.192e-05s; worst 1.407e-05s; std dev. 9.603e-07 (taking best). +Reference operation time is 1.19209e-05 s (1694 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6066,16 +6102,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 5.007e-06 s ~Mflops: 4034.521 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 89.286x: 0.000447s -> 5.007e-06s, so taking this instance. +After merge step 1: tpop: 1.192e-05 s ~Mflops: 1694.499 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 108.560x: 0.001294s -> 1.192e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.0058s (of which 3.695e-05s partitioning, 0.004289s I/O); computing times: 3.099e-05s in par. loops, 1.287e-05s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.0058s, equivalent to 1158.4/13.0 new/old ops (0.002716s for 2 clones -- as 542.5/6.1 ops, or 271.2/3.0 ops per clone), SPEEDUP of 89.286x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 89.286x (0.000447s -> 5.007e-06s), will amortize in 13.1 ops by saving 0.000442s per op. -In 1 tuning rounds (tot. 0.0085s, 0.0027s for constructor, 2 clones) obtained a SPEEDUP of 8828.6% (89.29x) (from 45.19 to 4035 Mflops). Employed 0.0045s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01447s (of which 7.2e-05s partitioning, 0.01027s I/O); computing times: 5.507e-05s in par. loops, 2.098e-05s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.01447s, equivalent to 1214.2/11.2 new/old ops (0.02126s for 2 clones -- as 1783.1/16.4 ops, or 891.5/8.2 ops per clone), SPEEDUP of 108.560x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 108.560x (0.001294s -> 1.192e-05s), will amortize in 11.3 ops by saving 0.001282s per op. +In 1 tuning rounds (tot. 0.038s, 0.021s for constructor, 2 clones) obtained a SPEEDUP of 10756.0% (108.6x) (from 15.61 to 1694 Mflops). Employed 0.01s for I/O of matrix plots. #pr: updating sample at index 2 (1^th of 4), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.013145 s (4.470e-04 s -> 5.007e-06 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0484741 s (1.294e-03 s -> 1.192e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6141,20 +6177,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 2.122e-05s; avg 7.073e-06s ( +/- 29.21/ 41.57 %); best 5.007e-06s; worst 1.001e-05s; std dev. 2.135e-06 (taking best). -Reference operation time is 5.00679e-06 s (4035 Mflops) with 1 threads. +3 iterations (1 th.) took 3.91e-05s; avg 1.303e-05s ( +/- 15.85/ 22.56 %); best 1.097e-05s; worst 1.597e-05s; std dev. 2.135e-06 (taking best). +Reference operation time is 1.09673e-05 s (1842 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.397e-03 s (100.00 %) - analyzed arrays in 4.749e-04 s (34.00 %) - cleaned-up arrays in 9.060e-06 s (0.65 %) - deduplicated arrays in 6.914e-06 s (0.49 %) + converted COO to RSB in 3.925e-03 s (100.00 %) + analyzed arrays in 2.282e-03 s (58.14 %) + cleaned-up arrays in 1.788e-05 s (0.46 %) + deduplicated arrays in 1.502e-05 s (0.38 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.000e-04 s (64.43 %) - memory allocations took 3.099e-06 s (0.22 %) - leafs setup took 9.537e-07 s (0.07 %) - halfword conversion took 1.907e-06 s (0.14 %) -Built (100 x 100)[0xaaaad034b120]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 1.602e-03 s (40.82 %) + memory allocations took 2.861e-06 s (0.07 %) + leafs setup took 1.192e-06 s (0.03 %) + halfword conversion took 2.861e-06 s (0.07 %) +Built (100 x 100)[0xaaaaeaaae160]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6188,16 +6224,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 9.720e-04 s (100.00 %) - analyzed arrays in 4.580e-04 s (47.12 %) - cleaned-up arrays in 8.821e-06 s (0.91 %) - deduplicated arrays in 7.153e-06 s (0.74 %) + converted COO to RSB in 3.085e-03 s (100.00 %) + analyzed arrays in 2.296e-03 s (74.43 %) + cleaned-up arrays in 1.693e-05 s (0.55 %) + deduplicated arrays in 1.407e-05 s (0.46 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.940e-04 s (50.82 %) - memory allocations took 1.192e-06 s (0.12 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 1.907e-06 s (0.20 %) -Built (100 x 100)[0xaaaad0341650]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 7.489e-04 s (24.28 %) + memory allocations took 4.053e-06 s (0.13 %) + leafs setup took 9.537e-07 s (0.03 %) + halfword conversion took 3.099e-06 s (0.10 %) +Built (100 x 100)[0xaaaaeaaa4690]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6243,10 +6279,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 2.003e-05s; avg 6.676e-06s ( +/- 25.00/ 32.14 %); best 5.007e-06s; worst 8.821e-06s; std dev. 1.593e-06 (taking best). -Reference operation time is 5.00679e-06 s (4035 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 5.00679e-06 s/0 threads (speedup 1 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz +3 iterations (1 th.) took 3.505e-05s; avg 1.168e-05s ( +/- 14.29/ 28.57 %); best 1.001e-05s; worst 1.502e-05s; std dev. 2.36e-06 (taking best). +Reference operation time is 1.00136e-05 s (2017 Mflops) with 1 threads. +Challenging best inner round reference (1.09673e-05 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 1.00136e-05 s/0 threads (speedup 1.09524 x), same?n. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6279,16 +6314,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.777e-03 s (100.00 %) - analyzed arrays in 9.401e-04 s (33.85 %) - cleaned-up arrays in 9.060e-06 s (0.33 %) - deduplicated arrays in 6.914e-06 s (0.25 %) + converted COO to RSB in 6.723e-03 s (100.00 %) + analyzed arrays in 2.658e-03 s (39.54 %) + cleaned-up arrays in 1.502e-05 s (0.22 %) + deduplicated arrays in 1.287e-05 s (0.19 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.251e-04 s (33.31 %) - memory allocations took 9.537e-07 s (0.03 %) - leafs setup took 1.907e-06 s (0.07 %) - halfword conversion took 8.931e-04 s (32.16 %) -Built (100 x 100)[0xaaaad0341650]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 8, symflags:'LS' + shuffled partitions in 1.944e-03 s (28.92 %) + memory allocations took 3.099e-06 s (0.05 %) + leafs setup took 1.907e-06 s (0.03 %) + halfword conversion took 2.087e-03 s (31.04 %) +Built (100 x 100)[0xaaaaeaaae280]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 8, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6334,9 +6369,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001336s; avg 0.0004454s ( +/- 3.21/ 2.19 %); best 0.0004311s; worst 0.0004551s; std dev. 1.034e-05 (taking best). -Reference operation time is 0.000431061 s (46.86 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 0.5, 8 leaves, 2.185 bytes/nz, 0.000431061 s/0 threads (speedup 0.011615 x), same?n. +3 iterations (1 th.) took 0.002511s; avg 0.000837s ( +/- 11.24/ 9.81 %); best 0.0007429s; worst 0.0009191s; std dev. 7.243e-05 (taking best). +Reference operation time is 0.000742912 s (27.19 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/0 threads) with: subdivision 0.5, 8 leaves, 2.185 bytes/nz, 0.000742912 s/0 threads (speedup 0.0134788 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 11 subms, 8 lsubms, 2.1846 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6370,16 +6405,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.767e-03 s (100.00 %) - analyzed arrays in 9.310e-04 s (33.65 %) - cleaned-up arrays in 9.060e-06 s (0.33 %) - deduplicated arrays in 6.914e-06 s (0.25 %) + converted COO to RSB in 7.810e-03 s (100.00 %) + analyzed arrays in 2.323e-03 s (29.74 %) + cleaned-up arrays in 1.502e-05 s (0.19 %) + deduplicated arrays in 1.192e-05 s (0.15 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.210e-04 s (33.28 %) - memory allocations took 2.146e-06 s (0.08 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 8.960e-04 s (32.38 %) -Built (100 x 100)[0xaaaad034b240]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 19, symflags:'LS' + shuffled partitions in 3.622e-03 s (46.38 %) + memory allocations took 5.960e-06 s (0.08 %) + leafs setup took 5.960e-06 s (0.08 %) + halfword conversion took 1.826e-03 s (23.38 %) +Built (100 x 100)[0xaaaaeaaae280]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 19, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6425,9 +6460,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001339s; avg 0.0004463s ( +/- 1.66/ 1.28 %); best 0.0004389s; worst 0.000452s; std dev. 5.482e-06 (taking best). -Reference operation time is 0.000438929 s (46.02 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 1, 19 leaves, 2.272 bytes/nz, 0.000438929 s/0 threads (speedup 0.0114068 x), same?n. +3 iterations (1 th.) took 0.002443s; avg 0.0008144s ( +/- 34.65/ 23.90 %); best 0.0005322s; worst 0.001009s; std dev. 0.0002043 (taking best). +Reference operation time is 0.00053215 s (37.96 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/0 threads) with: subdivision 1, 19 leaves, 2.272 bytes/nz, 0.00053215 s/0 threads (speedup 0.0188172 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 26 subms, 19 lsubms, 2.2725 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6461,16 +6496,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.838e-03 s (100.00 %) - analyzed arrays in 9.449e-04 s (33.29 %) - cleaned-up arrays in 8.821e-06 s (0.31 %) - deduplicated arrays in 7.153e-06 s (0.25 %) + converted COO to RSB in 4.943e-03 s (100.00 %) + analyzed arrays in 1.858e-03 s (37.59 %) + cleaned-up arrays in 1.812e-05 s (0.37 %) + deduplicated arrays in 1.502e-05 s (0.30 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.711e-04 s (34.22 %) - memory allocations took 2.146e-06 s (0.08 %) - leafs setup took 3.099e-06 s (0.11 %) - halfword conversion took 9.000e-04 s (31.71 %) -Built (100 x 100)[0xaaaad034b240]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.562e-03 s (31.60 %) + memory allocations took 4.768e-06 s (0.10 %) + leafs setup took 4.053e-06 s (0.08 %) + halfword conversion took 1.480e-03 s (29.94 %) +Built (100 x 100)[0xaaaaeaaae280]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6516,9 +6551,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001339s; avg 0.0004463s ( +/- 2.30/ 2.62 %); best 0.0004361s; worst 0.000458s; std dev. 9.012e-06 (taking best). -Reference operation time is 0.000436068 s (46.32 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000436068 s/0 threads (speedup 0.0114817 x), same?n. +3 iterations (1 th.) took 0.002188s; avg 0.0007293s ( +/- 3.63/ 6.28 %); best 0.0007029s; worst 0.0007751s; std dev. 3.25e-05 (taking best). +Reference operation time is 0.000702858 s (28.74 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/0 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000702858 s/0 threads (speedup 0.0142469 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6552,16 +6587,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.797e-03 s (100.00 %) - analyzed arrays in 9.391e-04 s (33.58 %) - cleaned-up arrays in 9.060e-06 s (0.32 %) - deduplicated arrays in 6.914e-06 s (0.25 %) + converted COO to RSB in 6.925e-03 s (100.00 %) + analyzed arrays in 3.341e-03 s (48.24 %) + cleaned-up arrays in 1.693e-05 s (0.24 %) + deduplicated arrays in 1.502e-05 s (0.22 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.360e-04 s (33.47 %) - memory allocations took 1.907e-06 s (0.07 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 9.019e-04 s (32.25 %) -Built (100 x 100)[0xaaaad035e320]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 2.027e-03 s (29.27 %) + memory allocations took 7.153e-06 s (0.10 %) + leafs setup took 2.861e-06 s (0.04 %) + halfword conversion took 1.515e-03 s (21.88 %) +Built (100 x 100)[0xaaaaeaad0030]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6607,11 +6642,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001342s; avg 0.0004474s ( +/- 1.19/ 0.62 %); best 0.000442s; worst 0.0004501s; std dev. 3.766e-06 (taking best). -Reference operation time is 0.000442028 s (45.7 Mflops) with 1 threads. -Challenging best inner round reference (5.00679e-06 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000442028 s/0 threads (speedup 0.0113269 x), same?n. +3 iterations (1 th.) took 0.002219s; avg 0.0007397s ( +/- 13.48/ 26.94 %); best 0.0006399s; worst 0.0009389s; std dev. 0.0001409 (taking best). +Reference operation time is 0.000639915 s (31.57 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/0 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000639915 s/0 threads (speedup 0.0156483 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 4034.52 Mflops. +Best sparse multiply performance with subdivision multiplier of 0.25: 2017.26 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6627,23 +6662,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0207548 s (eq. to 4e+03/ 4e+03 old/new op.times), gained local/global speedup 1 x (5.00679e-06 : 5.00679e-06) / 1 x (5.00679e-06 : 5.00679e-06). This is not amortizable ! -Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.021s, 0.014s for constructor, 0 clones) obtained NO speedup (best stays 4035 Mflops). -Second run of RSB Autotuner took 0.0207741 s and estimated a speedup of 1.000000 x (5.007e-06 s -> 5.007e-06 s per op) in same matrix (1 -> 1 lsubm) +Last tuner inner round (1 of 1) took 0.0438001 s (eq. to 4e+03/ 4e+03 old/new op.times), gained local/global speedup 1.09524 x (1.09673e-05 : 1.00136e-05) / 1.09524 x (1.09673e-05 : 1.00136e-05). This is amortizable in 45928 op.times. +In 1 tuning rounds (tot. 0.044s, 0.034s for constructor, 0 clones) obtained a SPEEDUP of 9.5% (1.095x) (from 1842 to 2017 Mflops). +Second run of RSB Autotuner took 0.0438318 s and estimated a speedup of 1.095238 x (1.097e-05 s -> 1.001e-05 s per op) in new matrix (1 -> 1 lsubm) +RSB Autotuner suggested a new matrix: freeing the old one. #min:1 #max:1 #sum:100 #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000542 0.001893 0.002435 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002435 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000542 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001893 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.001319 0.003931 0.005250 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005250 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001319 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003931 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002435 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.005250 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -6658,34 +6693,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00339293 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00704694 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.000542164 0 0.00189304 -# so far, program took 5.480s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.091s/0.000s . +%constructor:lower-100x100-5050nz 0 0.00131893 0 0.00393081 +# so far, program took 5.581s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.198s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.044s (system CPU time used) -ru_utime : 6.358s (user CPU time used) +ru_stime : 0.06424s (system CPU time used) +ru_utime : 6.466s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.480s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.091s/0.000s . +# so far, program took 5.581s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.198s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.239e-03 s (100.00 %) - analyzed arrays in 4.740e-04 s (14.63 %) - cleaned-up arrays in 8.821e-06 s (0.27 %) - deduplicated arrays in 8.106e-06 s (0.25 %) + converted COO to RSB in 5.956e-03 s (100.00 %) + analyzed arrays in 9.840e-04 s (16.52 %) + cleaned-up arrays in 1.693e-05 s (0.28 %) + deduplicated arrays in 1.407e-05 s (0.24 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.831e-03 s (56.53 %) - memory allocations took 2.146e-06 s (0.07 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 9.131e-04 s (28.19 %) -Built (100 x 100)[0xaaaad034b240]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.003s): (100 x 100)[0xaaaad034b240]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 3.244e-03 s (54.47 %) + memory allocations took 4.053e-06 s (0.07 %) + leafs setup took 1.907e-06 s (0.03 %) + halfword conversion took 1.691e-03 s (28.39 %) +Built (100 x 100)[0xaaaaeaaae280]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.006s): (100 x 100)[0xaaaaeaaae280]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -6736,10 +6771,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001561s; avg 0.0005204s ( +/- 1.04/ 0.52 %); best 0.000515s; worst 0.0005231s; std dev. 3.821e-06 (taking best). -Reference operation time is 0.000514984 s (156.9 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.000515 Mflops: 156.898) -Merge (3 -> 1 leaves) took w.c.t. of 3.6e-05s, ~3.123e-05s of computing time (of which 1.311e-05s sorting, 1.907e-06s analysis) +3 iterations (1 th.) took 0.002228s; avg 0.0007427s ( +/- 3.85/ 6.77 %); best 0.0007141s; worst 0.000793s; std dev. 3.568e-05 (taking best). +Reference operation time is 0.000714064 s (113.2 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0007141 Mflops: 113.155) +Merge (3 -> 1 leaves) took w.c.t. of 5.293e-05s, ~4.601e-05s of computing time (of which 1.979e-05s sorting, 1.907e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6770,8 +6805,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 5.984e-05s; avg 1.995e-05s ( +/- 5.58/ 9.96 %); best 1.884e-05s; worst 2.193e-05s; std dev. 1.408e-06 (taking best). -Reference operation time is 1.88351e-05 s (4290 Mflops) with 1 threads. +3 iterations (1 th.) took 9.418e-05s; avg 3.139e-05s ( +/- 1.27/ 2.53 %); best 3.099e-05s; worst 3.219e-05s; std dev. 5.62e-07 (taking best). +Reference operation time is 3.09944e-05 s (2607 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6787,16 +6822,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 1.884e-05 s ~Mflops: 4289.870 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 27.342x: 0.000515s -> 1.884e-05s, so taking this instance. +After merge step 1: tpop: 3.099e-05 s ~Mflops: 2606.921 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 23.038x: 0.0007141s -> 3.099e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.006553s (of which 3.791e-05s partitioning, 0.004761s I/O); computing times: 3.123e-05s in par. loops, 1.311e-05s sorting, 1.907e-06s analyzing) -Total merge + benchmarking process took 0.006553s, equivalent to 347.9/12.7 new/old ops (0.003035s for 2 clones -- as 161.1/5.9 ops, or 80.6/2.9 ops per clone), SPEEDUP of 27.342x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 27.342x (0.000515s -> 1.884e-05s), will amortize in 13.2 ops by saving 0.0004961s per op. -In 1 tuning rounds (tot. 0.0097s, 0.003s for constructor, 2 clones) obtained a SPEEDUP of 2634.2% (27.34x) (from 156.9 to 4290 Mflops). Employed 0.0045s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01133s (of which 5.722e-05s partitioning, 0.008337s I/O); computing times: 4.601e-05s in par. loops, 1.979e-05s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.01133s, equivalent to 365.5/15.9 new/old ops (0.005675s for 2 clones -- as 183.1/7.9 ops, or 91.5/4.0 ops per clone), SPEEDUP of 23.038x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 23.038x (0.0007141s -> 3.099e-05s), will amortize in 16.6 ops by saving 0.0006831s per op. +In 1 tuning rounds (tot. 0.016s, 0.0057s for constructor, 2 clones) obtained a SPEEDUP of 2203.8% (23.04x) (from 113.2 to 2607 Mflops). Employed 0.012s for I/O of matrix plots. #pr: updating sample at index 3 (2^th of 4), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.014158 s (5.150e-04 s -> 1.884e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0281918 s (7.141e-04 s -> 3.099e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6862,20 +6897,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 6.318e-05s; avg 2.106e-05s ( +/- 9.43/ 18.87 %); best 1.907e-05s; worst 2.503e-05s; std dev. 2.81e-06 (taking best). -Reference operation time is 1.90735e-05 s (4236 Mflops) with 1 threads. +3 iterations (1 th.) took 0.0001111s; avg 3.703e-05s ( +/- 7.94/ 13.30 %); best 3.409e-05s; worst 4.196e-05s; std dev. 3.506e-06 (taking best). +Reference operation time is 3.40939e-05 s (2370 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.597e-03 s (100.00 %) - analyzed arrays in 5.291e-04 s (33.12 %) - cleaned-up arrays in 8.821e-06 s (0.55 %) - deduplicated arrays in 7.153e-06 s (0.45 %) + converted COO to RSB in 2.217e-03 s (100.00 %) + analyzed arrays in 7.160e-04 s (32.29 %) + cleaned-up arrays in 1.502e-05 s (0.68 %) + deduplicated arrays in 1.383e-05 s (0.62 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.048e-03 s (65.61 %) - memory allocations took 2.146e-06 s (0.13 %) - leafs setup took 1.192e-06 s (0.07 %) - halfword conversion took 9.537e-07 s (0.06 %) -Built (100 x 100)[0xaaaad034b120]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 1.465e-03 s (66.07 %) + memory allocations took 3.338e-06 s (0.15 %) + leafs setup took 2.146e-06 s (0.10 %) + halfword conversion took 1.907e-06 s (0.09 %) +Built (100 x 100)[0xaaaaeaaae160]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -6909,16 +6944,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.054e-03 s (100.00 %) - analyzed arrays in 9.620e-04 s (31.50 %) - cleaned-up arrays in 7.868e-06 s (0.26 %) - deduplicated arrays in 7.153e-06 s (0.23 %) + converted COO to RSB in 5.046e-03 s (100.00 %) + analyzed arrays in 1.385e-03 s (27.45 %) + cleaned-up arrays in 1.502e-05 s (0.30 %) + deduplicated arrays in 1.311e-05 s (0.26 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.034e-03 s (33.86 %) - memory allocations took 1.907e-06 s (0.06 %) - leafs setup took 1.907e-06 s (0.06 %) - halfword conversion took 1.039e-03 s (34.02 %) -Built (100 x 100)[0xaaaad0341a20]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + shuffled partitions in 1.548e-03 s (30.68 %) + memory allocations took 3.815e-06 s (0.08 %) + leafs setup took 1.907e-06 s (0.04 %) + halfword conversion took 2.079e-03 s (41.20 %) +Built (100 x 100)[0xaaaaeaaae280]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6964,9 +6999,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001521s; avg 0.000507s ( +/- 2.37/ 2.95 %); best 0.000495s; worst 0.0005219s; std dev. 1.119e-05 (taking best). -Reference operation time is 0.000494957 s (163.2 Mflops) with 1 threads. -Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000494957 s/0 threads (speedup 0.0385356 x), same?n. +3 iterations (1 th.) took 0.002425s; avg 0.0008083s ( +/- 29.00/ 23.11 %); best 0.0005739s; worst 0.0009952s; std dev. 0.0001753 (taking best). +Reference operation time is 0.000573874 s (140.8 Mflops) with 1 threads. +Challenging best inner round reference (3.40939e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.000573874 s/0 threads (speedup 0.0594101 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7000,16 +7035,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.219e-03 s (100.00 %) - analyzed arrays in 1.174e-03 s (36.47 %) - cleaned-up arrays in 8.821e-06 s (0.27 %) - deduplicated arrays in 7.153e-06 s (0.22 %) + converted COO to RSB in 5.580e-03 s (100.00 %) + analyzed arrays in 2.186e-03 s (39.18 %) + cleaned-up arrays in 1.192e-05 s (0.21 %) + deduplicated arrays in 1.001e-05 s (0.18 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.019e-03 s (31.66 %) - memory allocations took 1.907e-06 s (0.06 %) - leafs setup took 1.192e-06 s (0.04 %) - halfword conversion took 1.006e-03 s (31.25 %) -Built (100 x 100)[0xaaaad034b240]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 1.366e-03 s (24.48 %) + memory allocations took 4.053e-06 s (0.07 %) + leafs setup took 9.537e-07 s (0.02 %) + halfword conversion took 2.000e-03 s (35.84 %) +Built (100 x 100)[0xaaaaeaaae280]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7055,9 +7090,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001687s; avg 0.0005623s ( +/- 18.89/ 17.91 %); best 0.0004561s; worst 0.000663s; std dev. 8.458e-05 (taking best). -Reference operation time is 0.000456095 s (177.2 Mflops) with 1 threads. -Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000456095 s/0 threads (speedup 0.0418191 x), same?n. +3 iterations (1 th.) took 0.002348s; avg 0.0007826s ( +/- 18.36/ 12.44 %); best 0.000639s; worst 0.00088s; std dev. 0.0001037 (taking best). +Reference operation time is 0.000638962 s (126.5 Mflops) with 1 threads. +Challenging best inner round reference (3.40939e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.000638962 s/0 threads (speedup 0.0533582 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7091,16 +7126,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.424e-03 s (100.00 %) - analyzed arrays in 1.001e-03 s (29.24 %) - cleaned-up arrays in 9.060e-06 s (0.26 %) - deduplicated arrays in 6.914e-06 s (0.20 %) + converted COO to RSB in 6.811e-03 s (100.00 %) + analyzed arrays in 2.498e-03 s (36.68 %) + cleaned-up arrays in 9.060e-06 s (0.13 %) + deduplicated arrays in 9.060e-06 s (0.13 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.009e-03 s (29.47 %) - memory allocations took 1.907e-06 s (0.06 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 1.395e-03 s (40.74 %) -Built (100 x 100)[0xaaaad034b240]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 23, symflags:'LS' + shuffled partitions in 2.442e-03 s (35.85 %) + memory allocations took 4.053e-06 s (0.06 %) + leafs setup took 3.099e-06 s (0.05 %) + halfword conversion took 1.846e-03 s (27.10 %) +Built (100 x 100)[0xaaaaeaaae280]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 25, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7146,10 +7181,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001439s; avg 0.0004797s ( +/- 1.14/ 0.89 %); best 0.0004742s; worst 0.000484s; std dev. 4.079e-06 (taking best). -Reference operation time is 0.000474215 s (170.4 Mflops) with 1 threads. -Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 1, 23 leaves, 2.295 bytes/nz, 0.000474215 s/0 threads (speedup 0.0402212 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 32 subms, 23 lsubms, 2.2947 bpnz +3 iterations (1 th.) took 0.002757s; avg 0.0009189s ( +/- 20.69/ 36.91 %); best 0.0007288s; worst 0.001258s; std dev. 0.0002404 (taking best). +Reference operation time is 0.000728846 s (110.9 Mflops) with 1 threads. +Challenging best inner round reference (3.40939e-05 s/1 threads) with: subdivision 1, 25 leaves, 2.317 bytes/nz, 0.000728846 s/0 threads (speedup 0.0467779 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 34 subms, 25 lsubms, 2.3168 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7182,16 +7217,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.733e-03 s (100.00 %) - analyzed arrays in 1.024e-03 s (27.43 %) - cleaned-up arrays in 9.060e-06 s (0.24 %) - deduplicated arrays in 6.914e-06 s (0.19 %) + converted COO to RSB in 5.008e-03 s (100.00 %) + analyzed arrays in 1.730e-03 s (34.54 %) + cleaned-up arrays in 9.060e-06 s (0.18 %) + deduplicated arrays in 7.868e-06 s (0.16 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.151e-03 s (30.83 %) - memory allocations took 3.099e-06 s (0.08 %) - leafs setup took 2.146e-06 s (0.06 %) - halfword conversion took 1.537e-03 s (41.17 %) -Built (100 x 100)[0xaaaad0371ee0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 2.010e-03 s (40.13 %) + memory allocations took 3.099e-06 s (0.06 %) + leafs setup took 2.146e-06 s (0.04 %) + halfword conversion took 1.246e-03 s (24.88 %) +Built (100 x 100)[0xaaaaeaad4f20]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7237,9 +7272,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001184s; avg 0.0003947s ( +/- 39.47/ 20.10 %); best 0.0002389s; worst 0.000474s; std dev. 0.0001101 (taking best). -Reference operation time is 0.000238895 s (338.2 Mflops) with 1 threads. -Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000238895 s/0 threads (speedup 0.0798403 x), same?n. +3 iterations (1 th.) took 0.001754s; avg 0.0005847s ( +/- 13.31/ 9.81 %); best 0.0005069s; worst 0.0006421s; std dev. 5.705e-05 (taking best). +Reference operation time is 0.000506878 s (159.4 Mflops) with 1 threads. +Challenging best inner round reference (3.40939e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000506878 s/0 threads (speedup 0.0672625 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7273,16 +7308,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.051e-03 s (100.00 %) - analyzed arrays in 1.114e-03 s (36.51 %) - cleaned-up arrays in 1.717e-05 s (0.56 %) - deduplicated arrays in 1.383e-05 s (0.45 %) + converted COO to RSB in 4.026e-03 s (100.00 %) + analyzed arrays in 1.204e-03 s (29.91 %) + cleaned-up arrays in 9.060e-06 s (0.23 %) + deduplicated arrays in 8.106e-06 s (0.20 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.682e-04 s (31.73 %) - memory allocations took 5.007e-06 s (0.16 %) - leafs setup took 3.815e-06 s (0.13 %) - halfword conversion took 9.282e-04 s (30.42 %) -Built (100 x 100)[0xaaaad0371ee0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.202e-03 s (29.85 %) + memory allocations took 3.815e-06 s (0.09 %) + leafs setup took 1.192e-06 s (0.03 %) + halfword conversion took 1.597e-03 s (39.67 %) +Built (100 x 100)[0xaaaaeaad4f20]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7328,11 +7363,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.00119s; avg 0.0003966s ( +/- 36.23/ 18.47 %); best 0.000253s; worst 0.0004699s; std dev. 0.0001016 (taking best). -Reference operation time is 0.000252962 s (319.4 Mflops) with 1 threads. -Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000252962 s/0 threads (speedup 0.0754006 x), same?n. +3 iterations (1 th.) took 0.003458s; avg 0.001153s ( +/- 57.93/109.51 %); best 0.0004849s; worst 0.002415s; std dev. 0.0008931 (taking best). +Reference operation time is 0.000484943 s (166.6 Mflops) with 1 threads. +Challenging best inner round reference (3.40939e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000484943 s/0 threads (speedup 0.0703048 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 4236.25 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 2369.93 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7348,23 +7383,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.0265019 s (eq. to 1e+03/ 1e+03 old/new op.times), gained local/global speedup 1 x (1.90735e-05 : 1.90735e-05) / 1 x (1.90735e-05 : 1.90735e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.0427051 s (eq. to 1e+03/ 1e+03 old/new op.times), gained local/global speedup 1 x (3.40939e-05 : 3.40939e-05) / 1 x (3.40939e-05 : 3.40939e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.027s, 0.019s for constructor, 0 clones) obtained NO speedup (best stays 4236 Mflops). -Second run of RSB Autotuner took 0.026525 s and estimated a speedup of 1.000000 x (1.907e-05 s -> 1.907e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.043s, 0.029s for constructor, 0 clones) obtained NO speedup (best stays 2370 Mflops). +Second run of RSB Autotuner took 0.042733 s and estimated a speedup of 1.000000 x (3.409e-05 s -> 3.409e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000474 0.001831 0.002305 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002305 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000474 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.001831 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000984 0.003244 0.004228 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004228 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000984 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003244 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002305 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.004228 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -7379,34 +7414,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00323915 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00595617 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.000473976 0 0.00183105 -# so far, program took 5.528s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.131s/0.000s . +%constructor:lower-100x100-5050nz 0 0.000983953 0 0.00324416 +# so far, program took 5.661s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.269s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.05211s (system CPU time used) -ru_utime : 6.799s (user CPU time used) +ru_stime : 0.06831s (system CPU time used) +ru_utime : 6.884s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was D). # Cache block size total 524288 bytes, per-thread 524288 bytes -# so far, program took 5.528s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.131s/0.000s . +# so far, program took 5.661s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.269s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.596e-03 s (100.00 %) - analyzed arrays in 4.890e-04 s (13.60 %) - cleaned-up arrays in 1.693e-05 s (0.47 %) - deduplicated arrays in 1.502e-05 s (0.42 %) + converted COO to RSB in 4.717e-03 s (100.00 %) + analyzed arrays in 8.528e-04 s (18.08 %) + cleaned-up arrays in 9.060e-06 s (0.19 %) + deduplicated arrays in 7.868e-06 s (0.17 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.165e-03 s (60.20 %) - memory allocations took 5.960e-06 s (0.17 %) - leafs setup took 2.146e-06 s (0.06 %) - halfword conversion took 9.010e-04 s (25.05 %) -Built (100 x 100)[0xaaaad034b240]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.004s): (100 x 100)[0xaaaad034b240]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 2.215e-03 s (46.96 %) + memory allocations took 4.292e-06 s (0.09 %) + leafs setup took 9.537e-07 s (0.02 %) + halfword conversion took 1.627e-03 s (34.49 %) +Built (100 x 100)[0xaaaaeaaae280]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.005s): (100 x 100)[0xaaaaeaaae280]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -7457,10 +7492,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0013s; avg 0.0004334s ( +/- 1.25/ 0.62 %); best 0.000428s; worst 0.0004361s; std dev. 3.821e-06 (taking best). -Reference operation time is 0.000427961 s (188.8 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.000428 Mflops: 188.802) -Merge (3 -> 1 leaves) took w.c.t. of 6.08e-05s, ~5.293e-05s of computing time (of which 2.503e-05s sorting, 1.907e-06s analysis) +3 iterations (1 th.) took 0.002146s; avg 0.0007153s ( +/- 1.01/ 0.92 %); best 0.0007081s; worst 0.0007219s; std dev. 5.663e-06 (taking best). +Reference operation time is 0.000708103 s (114.1 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.0007081 Mflops: 114.108) +Merge (3 -> 1 leaves) took w.c.t. of 4.411e-05s, ~3.695e-05s of computing time (of which 1.788e-05s sorting, 2.146e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7491,8 +7526,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 9.894e-05s; avg 3.298e-05s ( +/- 2.41/ 2.65 %); best 3.219e-05s; worst 3.386e-05s; std dev. 6.837e-07 (taking best). -Reference operation time is 3.21865e-05 s (2510 Mflops) with 1 threads. +3 iterations (1 th.) took 5.889e-05s; avg 1.963e-05s ( +/- 4.05/ 2.02 %); best 1.884e-05s; worst 2.003e-05s; std dev. 5.62e-07 (taking best). +Reference operation time is 1.88351e-05 s (4290 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7508,16 +7543,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 3.219e-05 s ~Mflops: 2510.369 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 13.296x: 0.000428s -> 3.219e-05s, so taking this instance. +After merge step 1: tpop: 1.884e-05 s ~Mflops: 4289.870 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 37.595x: 0.0007081s -> 1.884e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.006404s (of which 6.39e-05s partitioning, 0.004908s I/O); computing times: 5.293e-05s in par. loops, 2.503e-05s sorting, 1.907e-06s analyzing) -Total merge + benchmarking process took 0.006404s, equivalent to 199.0/15.0 new/old ops (0.002199s for 2 clones -- as 68.3/5.1 ops, or 34.2/2.6 ops per clone), SPEEDUP of 13.296x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 13.296x (0.000428s -> 3.219e-05s), will amortize in 16.2 ops by saving 0.0003958s per op. -In 1 tuning rounds (tot. 0.0089s, 0.0022s for constructor, 2 clones) obtained a SPEEDUP of 1229.6% (13.3x) (from 188.8 to 2510 Mflops). Employed 0.0055s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.01024s (of which 4.697e-05s partitioning, 0.007448s I/O); computing times: 3.695e-05s in par. loops, 1.788e-05s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.01024s, equivalent to 543.5/14.5 new/old ops (0.004738s for 2 clones -- as 251.6/6.7 ops, or 125.8/3.3 ops per clone), SPEEDUP of 37.595x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 37.595x (0.0007081s -> 1.884e-05s), will amortize in 14.9 ops by saving 0.0006893s per op. +In 1 tuning rounds (tot. 0.015s, 0.0047s for constructor, 2 clones) obtained a SPEEDUP of 3659.5% (37.59x) (from 114.1 to 4290 Mflops). Employed 0.0061s for I/O of matrix plots. #pr: updating sample at index 4 (3^th of 4), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.0146761 s (4.280e-04 s -> 3.219e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.0205898 s (7.081e-04 s -> 1.884e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -7583,20 +7618,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 9.584e-05s; avg 3.195e-05s ( +/- 9.70/ 15.67 %); best 2.885e-05s; worst 3.695e-05s; std dev. 3.574e-06 (taking best). -Reference operation time is 2.88486e-05 s (2801 Mflops) with 1 threads. +3 iterations (1 th.) took 6.604e-05s; avg 2.201e-05s ( +/- 13.36/ 22.38 %); best 1.907e-05s; worst 2.694e-05s; std dev. 3.506e-06 (taking best). +Reference operation time is 1.90735e-05 s (4236 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.391e-03 s (100.00 %) - analyzed arrays in 4.852e-04 s (34.88 %) - cleaned-up arrays in 1.407e-05 s (1.01 %) - deduplicated arrays in 1.192e-05 s (0.86 %) + converted COO to RSB in 1.182e-02 s (100.00 %) + analyzed arrays in 3.885e-03 s (32.87 %) + cleaned-up arrays in 1.001e-05 s (0.08 %) + deduplicated arrays in 6.914e-06 s (0.06 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 8.731e-04 s (62.77 %) - memory allocations took 2.861e-06 s (0.21 %) - leafs setup took 9.537e-07 s (0.07 %) - halfword conversion took 1.907e-06 s (0.14 %) -Built (100 x 100)[0xaaaad034b120]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 7.896e-03 s (66.81 %) + memory allocations took 1.502e-05 s (0.13 %) + leafs setup took 1.907e-06 s (0.02 %) + halfword conversion took 2.146e-06 s (0.02 %) +Built (100 x 100)[0xaaaaeaaae160]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 12). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7630,16 +7665,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.124e-03 s (100.00 %) - analyzed arrays in 1.294e-03 s (41.42 %) - cleaned-up arrays in 1.407e-05 s (0.45 %) - deduplicated arrays in 1.001e-05 s (0.32 %) + converted COO to RSB in 1.110e-02 s (100.00 %) + analyzed arrays in 6.441e-03 s (58.01 %) + cleaned-up arrays in 9.060e-06 s (0.08 %) + deduplicated arrays in 8.106e-06 s (0.07 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.019e-04 s (28.87 %) - memory allocations took 4.053e-06 s (0.13 %) - leafs setup took 9.537e-07 s (0.03 %) - halfword conversion took 8.991e-04 s (28.78 %) -Built (100 x 100)[0xaaaad034b240]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' + shuffled partitions in 1.691e-03 s (15.23 %) + memory allocations took 5.007e-06 s (0.05 %) + leafs setup took 2.146e-06 s (0.02 %) + halfword conversion took 2.946e-03 s (26.53 %) +Built (100 x 100)[0xaaaaeaaae280]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7685,9 +7720,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001141s; avg 0.0003803s ( +/- 39.00/ 20.19 %); best 0.000232s; worst 0.000457s; std dev. 0.0001049 (taking best). -Reference operation time is 0.000231981 s (348.3 Mflops) with 1 threads. -Challenging best inner round reference (2.88486e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 0.000231981 s/0 threads (speedup 0.124358 x), same?n. +3 iterations (1 th.) took 0.003138s; avg 0.001046s ( +/- 15.87/ 25.43 %); best 0.00088s; worst 0.001312s; std dev. 0.00019 (taking best). +Reference operation time is 0.000880003 s (91.82 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 0.000880003 s/0 threads (speedup 0.0216743 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 8 subms, 6 lsubms, 2.1632 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7721,16 +7756,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.890e-03 s (100.00 %) - analyzed arrays in 1.039e-03 s (35.95 %) - cleaned-up arrays in 1.287e-05 s (0.45 %) - deduplicated arrays in 1.097e-05 s (0.38 %) + converted COO to RSB in 5.571e-03 s (100.00 %) + analyzed arrays in 2.082e-03 s (37.37 %) + cleaned-up arrays in 8.821e-06 s (0.16 %) + deduplicated arrays in 9.060e-06 s (0.16 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.201e-04 s (31.83 %) - memory allocations took 4.292e-06 s (0.15 %) - leafs setup took 1.907e-06 s (0.07 %) - halfword conversion took 9.000e-04 s (31.14 %) -Built (100 x 100)[0xaaaad034b240]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' + shuffled partitions in 2.037e-03 s (36.56 %) + memory allocations took 4.053e-06 s (0.07 %) + leafs setup took 1.907e-06 s (0.03 %) + halfword conversion took 1.428e-03 s (25.63 %) +Built (100 x 100)[0xaaaaeaaae280]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7776,9 +7811,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001132s; avg 0.0003773s ( +/- 38.77/ 19.55 %); best 0.000231s; worst 0.0004511s; std dev. 0.0001035 (taking best). -Reference operation time is 0.000231028 s (349.7 Mflops) with 1 threads. -Challenging best inner round reference (2.88486e-05 s/1 threads) with: subdivision 0.5, 16 leaves, 2.25 bytes/nz, 0.000231028 s/0 threads (speedup 0.124871 x), same?n. +3 iterations (1 th.) took 0.002246s; avg 0.0007486s ( +/- 9.33/ 9.14 %); best 0.0006788s; worst 0.0008171s; std dev. 5.646e-05 (taking best). +Reference operation time is 0.000678778 s (119 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 0.5, 16 leaves, 2.25 bytes/nz, 0.000678778 s/0 threads (speedup 0.0280998 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 22 subms, 16 lsubms, 2.2503 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7812,16 +7847,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.964e-03 s (100.00 %) - analyzed arrays in 1.074e-03 s (36.24 %) - cleaned-up arrays in 1.311e-05 s (0.44 %) - deduplicated arrays in 1.097e-05 s (0.37 %) + converted COO to RSB in 4.839e-03 s (100.00 %) + analyzed arrays in 1.887e-03 s (39.00 %) + cleaned-up arrays in 8.821e-06 s (0.18 %) + deduplicated arrays in 9.060e-06 s (0.19 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.570e-04 s (32.29 %) - memory allocations took 1.907e-06 s (0.06 %) - leafs setup took 1.907e-06 s (0.06 %) - halfword conversion took 9.041e-04 s (30.50 %) -Built (100 x 100)[0xaaaad0399630]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.411e-03 s (29.16 %) + memory allocations took 3.099e-06 s (0.06 %) + leafs setup took 2.146e-06 s (0.04 %) + halfword conversion took 1.516e-03 s (31.33 %) +Built (100 x 100)[0xaaaaeaafc670]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7867,9 +7902,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001559s; avg 0.0005197s ( +/- 50.36/ 63.56 %); best 0.000258s; worst 0.00085s; std dev. 0.0002465 (taking best). -Reference operation time is 0.000257969 s (313.2 Mflops) with 1 threads. -Challenging best inner round reference (2.88486e-05 s/1 threads) with: subdivision 1, 36 leaves, 2.383 bytes/nz, 0.000257969 s/0 threads (speedup 0.11183 x), same?n. +3 iterations (1 th.) took 0.001904s; avg 0.0006347s ( +/- 3.27/ 1.95 %); best 0.0006139s; worst 0.0006471s; std dev. 1.476e-05 (taking best). +Reference operation time is 0.000613928 s (131.6 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 1, 36 leaves, 2.383 bytes/nz, 0.000613928 s/0 threads (speedup 0.031068 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7903,16 +7938,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.730e-03 s (100.00 %) - analyzed arrays in 9.191e-04 s (33.67 %) - cleaned-up arrays in 1.407e-05 s (0.52 %) - deduplicated arrays in 1.097e-05 s (0.40 %) + converted COO to RSB in 5.115e-03 s (100.00 %) + analyzed arrays in 1.244e-03 s (24.32 %) + cleaned-up arrays in 1.192e-05 s (0.23 %) + deduplicated arrays in 1.097e-05 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.029e-04 s (33.07 %) - memory allocations took 5.007e-06 s (0.18 %) - leafs setup took 3.099e-06 s (0.11 %) - halfword conversion took 8.740e-04 s (32.01 %) -Built (100 x 100)[0xaaaad0399630]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 2.250e-03 s (43.99 %) + memory allocations took 4.292e-06 s (0.08 %) + leafs setup took 2.861e-06 s (0.06 %) + halfword conversion took 1.590e-03 s (31.09 %) +Built (100 x 100)[0xaaaaeaafc670]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7958,9 +7993,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.001562s; avg 0.0005207s ( +/- 28.16/ 39.01 %); best 0.0003741s; worst 0.0007238s; std dev. 0.0001483 (taking best). -Reference operation time is 0.000374079 s (216 Mflops) with 1 threads. -Challenging best inner round reference (2.88486e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000374079 s/0 threads (speedup 0.0771192 x), same?n. +3 iterations (1 th.) took 0.002335s; avg 0.0007783s ( +/- 7.88/ 6.76 %); best 0.0007169s; worst 0.0008309s; std dev. 4.693e-05 (taking best). +Reference operation time is 0.000716925 s (112.7 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.000716925 s/0 threads (speedup 0.0266046 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes @@ -7994,16 +8029,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 3.189e-03 s (100.00 %) - analyzed arrays in 9.680e-04 s (30.35 %) - cleaned-up arrays in 1.407e-05 s (0.44 %) - deduplicated arrays in 1.097e-05 s (0.34 %) + converted COO to RSB in 4.419e-03 s (100.00 %) + analyzed arrays in 1.435e-03 s (32.48 %) + cleaned-up arrays in 1.097e-05 s (0.25 %) + deduplicated arrays in 9.060e-06 s (0.21 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 8.821e-04 s (27.66 %) - memory allocations took 5.007e-06 s (0.16 %) - leafs setup took 2.861e-06 s (0.09 %) - halfword conversion took 1.306e-03 s (40.95 %) -Built (100 x 100)[0xaaaad0399630]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 1.601e-03 s (36.23 %) + memory allocations took 4.768e-06 s (0.11 %) + leafs setup took 5.007e-06 s (0.11 %) + halfword conversion took 1.353e-03 s (30.62 %) +Built (100 x 100)[0xaaaaeaafc670]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8049,11 +8084,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.002501s; avg 0.0008337s ( +/- 14.23/ 14.08 %); best 0.000715s; worst 0.0009511s; std dev. 9.636e-05 (taking best). -Reference operation time is 0.000715017 s (113 Mflops) with 1 threads. -Challenging best inner round reference (2.88486e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000715017 s/0 threads (speedup 0.0403468 x), same?n. +3 iterations (1 th.) took 0.002744s; avg 0.0009147s ( +/- 30.59/ 16.01 %); best 0.0006349s; worst 0.001061s; std dev. 0.0001979 (taking best). +Reference operation time is 0.000634909 s (127.3 Mflops) with 1 threads. +Challenging best inner round reference (1.90735e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.000634909 s/0 threads (speedup 0.0300413 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 2800.82 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 4236.25 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 524288 bytes, per-thread 524288 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8069,23 +8104,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.026011 s (eq. to 9e+02/ 9e+02 old/new op.times), gained local/global speedup 1 x (2.88486e-05 : 2.88486e-05) / 1 x (2.88486e-05 : 2.88486e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 0.0566041 s (eq. to 3e+03/ 3e+03 old/new op.times), gained local/global speedup 1 x (1.90735e-05 : 1.90735e-05) / 1 x (1.90735e-05 : 1.90735e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.026s, 0.017s for constructor, 0 clones) obtained NO speedup (best stays 2801 Mflops). -Second run of RSB Autotuner took 0.0260441 s and estimated a speedup of 1.000000 x (2.885e-05 s -> 2.885e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 0.057s, 0.043s for constructor, 0 clones) obtained NO speedup (best stays 4236 Mflops). +Second run of RSB Autotuner took 0.056627 s and estimated a speedup of 1.000000 x (1.907e-05 s -> 1.907e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000489 0.002165 0.002654 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002654 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000489 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002165 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000853 0.002215 0.003068 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003068 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000853 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002215 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.002654 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.003068 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -8100,68 +8135,68 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.00359607 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.00471687 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.000488997 0 0.00216484 -# so far, program took 5.576s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.172s/0.000s . +%constructor:lower-100x100-5050nz 0 0.000852823 0 0.00221491 +# so far, program took 5.747s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.346s/0.000s . getrusage() stats: ru_maxrss: 6 (maximum resident set size -- MB) -ru_stime : 0.0561s (system CPU time used) -ru_utime : 7.217s (user CPU time used) +ru_stime : 0.07258s (system CPU time used) +ru_utime : 7.277s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 4) ordered by (1,1,1,1,1,4,1) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 3389.00 6.211e-04 0.000e+00 5.960e-06 0.000e+00 2.131e-02 8.94e+00 2.60e+00 1 2.02e-02 -pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 4034.52 4.470e-04 0.000e+00 5.007e-06 0.000e+00 1.314e-02 6.37e+00 1.56e+00 1 2.02e-02 -pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 4289.87 5.150e-04 0.000e+00 1.884e-05 0.000e+00 1.416e-02 2.83e+00 6.50e-01 1 8.08e-02 -pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 2510.37 4.280e-04 0.000e+00 3.219e-05 0.000e+00 1.468e-02 2.99e+00 1.17e+00 1 8.08e-02 +pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 1245.96 1.158e-03 0.000e+00 1.621e-05 0.000e+00 4.153e-02 3.29e+00 2.60e+00 1 2.02e-02 +pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 1694.50 1.294e-03 0.000e+00 1.192e-05 0.000e+00 4.847e-02 2.68e+00 1.56e+00 1 2.02e-02 +pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 2606.92 7.141e-04 0.000e+00 3.099e-05 0.000e+00 2.819e-02 1.72e+00 6.50e-01 1 8.08e-02 +pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 4289.87 7.081e-04 0.000e+00 1.884e-05 0.000e+00 2.059e-02 5.10e+00 1.17e+00 1 8.08e-02 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 5753.1 % faster, avg. sp. ratio 58.531x, max sp. ratio 104.200x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 1852.0/456.0/3575.0/7408.1 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 31.4/ 27.5/ 34.3/125.5 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 32.5, min. 28.5, max. 37.1 ops) +#pr: (in succ. cases rsb autotuning gave avg. 5915.5 % faster, avg. sp. ratio 60.155x, max sp. ratio 108.560x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2157.7/909.6/4066.3/8631.0 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 35.5/ 29.1/ 39.5/141.9 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 36.3, min. 29.9, max. 41.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 1683/ 1683/ 1683) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 5050/ 5050/ 5050) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 15150/ 6733/ 26933) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 45450/ 20200/ 80800) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 2.121/ 2.121/ 2.121) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.206/ 2.788/ 8.809,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 21.131/ 2.830/ 8.943,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.148/ 1.694/ 5.017,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.786/ 1.720/ 5.102,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.495/ 0.650/ 2.599) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 2.080/ 2.080/ 2.080) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.06 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.02 s, min 0.01 s, max 0.02 s, tot 0.06 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.556e+03, min 2.510e+03, max 4.290e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.059e+02, min 3.252e+01, max 1.888e+02 (4 samples) -#pr: best tun. rsb operation time was: on avg. 1.550e-05s, min 5.007e-06s, max 3.219e-05s, tot 6.199e-05s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 5.028e-04s, min 4.280e-04s, max 6.211e-04s, tot 2.011e-03s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 5.312e+00 1.679e+01 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.03 s, min 0.02 s, max 0.05 s, tot 0.14 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.03 s, min 0.02 s, max 0.05 s, tot 0.14 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.459e+03, min 1.246e+03, max 4.290e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 6.508e+01, min 1.561e+01, max 1.141e+02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 1.949e-05s, min 1.192e-05s, max 3.099e-05s, tot 7.796e-05s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 9.686e-04s, min 7.081e-04s, max 1.294e-03s, tot 3.874e-03s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.328e+00 2.763e+01 #pr: in-cache to in-memory MEMSET bandwidth ratio: 1.020e+00 -#pr: Record collection took 0.17 s. +#pr: Record collection took 0.36 s. #pr: Record comprises 40 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 99 environment variables in 5459 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 99 environment variables in 5513 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. #pr: ======== Saved a performance record of 4 samples to test.rpr # Removing the temporary record file test.rpr.tmp. -# terminating run at 1773327844 (after 5.6s of w.c.t.) +# terminating run at 1738918497 (after 5.7s of w.c.t.) + ls -ltr test-tuning-lower-100x100-5050nz--C-N-1--base.eps test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--D-N-1--base.eps test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--S-N-1--base.eps test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--Z-N-1--base.eps test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85638 Mar 12 03:04 test-tuning-lower-100x100-5050nz--D-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84561 Mar 12 03:04 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85639 Mar 12 03:04 test-tuning-lower-100x100-5050nz--S-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84561 Mar 12 03:04 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85639 Mar 12 03:04 test-tuning-lower-100x100-5050nz--C-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84561 Mar 12 03:04 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85639 Mar 12 03:04 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84561 Mar 12 03:04 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85643 Feb 7 22:54 test-tuning-lower-100x100-5050nz--D-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84565 Feb 7 22:54 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85642 Feb 7 22:54 test-tuning-lower-100x100-5050nz--S-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84564 Feb 7 22:54 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85643 Feb 7 22:54 test-tuning-lower-100x100-5050nz--C-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84566 Feb 7 22:54 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85643 Feb 7 22:54 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84566 Feb 7 22:54 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps + rsbench --read-performance-record test.rpr + ls -ltr test.txt --rw-r--r-- 1 pbuilder1 pbuilder1 4092 Mar 12 03:04 test.txt +-rw-r--r-- 1 pbuilder2 pbuilder2 4092 Feb 7 22:54 test.txt + RSB_PR_WLTC=2 + RSB_PR_SR=0 + rsbench --read-performance-record test.rpr @@ -8171,29 +8206,29 @@ /usr/bin/kpsepath ++ kpsepath tex ++ sed 's/!!//g;s/:/\n/g;' -+ find . /nonexistent/first-build/.texlive2024/texmf-config/tex/kpsewhich// /nonexistent/first-build/.texlive2024/texmf-var/tex/kpsewhich// /nonexistent/first-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/first-build/.texlive2024/texmf-config/tex/generic// /nonexistent/first-build/.texlive2024/texmf-var/tex/generic// /nonexistent/first-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/first-build/.texlive2024/texmf-config/tex/latex// /nonexistent/first-build/.texlive2024/texmf-var/tex/latex// /nonexistent/first-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/first-build/.texlive2024/texmf-config/tex/// /nonexistent/first-build/.texlive2024/texmf-var/tex/// /nonexistent/first-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls -find: '/nonexistent/first-build/.texlive2024/texmf-config/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-var/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/kpsewhich//': No such file or directory ++ find . /nonexistent/second-build/.texlive2024/texmf-config/tex/kpsewhich// /nonexistent/second-build/.texlive2024/texmf-var/tex/kpsewhich// /nonexistent/second-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/second-build/.texlive2024/texmf-config/tex/generic// /nonexistent/second-build/.texlive2024/texmf-var/tex/generic// /nonexistent/second-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/second-build/.texlive2024/texmf-config/tex/latex// /nonexistent/second-build/.texlive2024/texmf-var/tex/latex// /nonexistent/second-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/second-build/.texlive2024/texmf-config/tex/// /nonexistent/second-build/.texlive2024/texmf-var/tex/// /nonexistent/second-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls +find: '/nonexistent/second-build/.texlive2024/texmf-config/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-var/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/kpsewhich//': No such file or directory find: '/usr/local/share/texmf/tex/kpsewhich//': No such file or directory find: '/etc/texmf/tex/kpsewhich//': No such file or directory find: '/var/lib/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texlive/texmf-dist/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-config/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-var/tex/generic//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-config/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-var/tex/generic//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/generic//': No such file or directory find: '/usr/local/share/texmf/tex/generic//': No such file or directory find: '/usr/share/texmf/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-config/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-var/tex/latex//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-config/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-var/tex/latex//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/latex//': No such file or directory find: '/usr/local/share/texmf/tex/latex//': No such file or directory find: '/etc/texmf/tex/latex//': No such file or directory find: '/var/lib/texmf/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-config/tex///': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-var/tex///': No such file or directory -find: '/nonexistent/first-build/texmf/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-config/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-var/tex///': No such file or directory +find: '/nonexistent/second-build/texmf/tex///': No such file or directory find: '/usr/local/share/texmf/tex///': No such file or directory + exit 0 for mf in pd.mtx vf.mtx ; do if test -f /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; then true; else cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/$mf /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; fi; done @@ -8208,7 +8243,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0xaaab12f054a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0xaaab1f29d4a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -8223,7 +8258,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0xaaaac6fec4a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0xaaab15d204a0]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -8287,51 +8322,51 @@ Done. Building a matrix with 5 nnz, 5 x 5 Duplicates check: 5 - 0 = 5 - converted COO to RSB in 8.900e-03 s (100.00 %) - analyzed arrays in 2.386e-03 s (26.81 %) - cleaned-up arrays in 1.192e-06 s (0.01 %) - deduplicated arrays in 9.537e-07 s (0.01 %) - sorted arrays in 1.216e-03 s (13.66 %) - shuffled partitions in 2.309e-03 s (25.94 %) - memory allocations took 1.073e-05 s (0.12 %) - leafs setup took 9.537e-07 s (0.01 %) - halfword conversion took 2.974e-03 s (33.42 %) -Built (5 x 5)[0xaaaac6fee820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' + converted COO to RSB in 1.192e-02 s (100.00 %) + analyzed arrays in 3.948e-03 s (33.11 %) + cleaned-up arrays in 9.537e-07 s (0.01 %) + deduplicated arrays in 0.000e+00 s (0.00 %) + sorted arrays in 2.023e-03 s (16.97 %) + shuffled partitions in 3.794e-03 s (31.82 %) + memory allocations took 4.053e-06 s (0.03 %) + leafs setup took 1.907e-06 s (0.02 %) + halfword conversion took 2.151e-03 s (18.04 %) +Built (5 x 5)[0xaaab15d22820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' Allocated matrix of 5 nonzeroes: -(5 x 5)[0xaaaac6fee820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(5 x 5)[0xaaab15d22820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -Before auto-tuning, 100 multiplications took 0.100310s. +Before auto-tuning, 100 multiplications took 0.160826s. Threads autotuning (may take more than 1.500000s)... Will use autotuning routine to sample matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=7.06911e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.002886s; avg 0.000962s ( +/- 32.84/ 25.25 %); best 0.0006461s; worst 0.001205s; std dev. 0.0002339 (taking best). -Reference operation time is 0.000646114 s (0.03095 Mflops) with 12 threads. -3 iterations (12 th.) took 0.003491s; avg 0.001164s ( +/- 21.81/ 29.16 %); best 0.0009098s; worst 0.001503s; std dev. 0.0002496 (taking best). -Reference operation time is 0.000909805 s (0.02198 Mflops) with 12 threads. -After 0.006459s, autotuning routine did not find a better threads count configuration. -(5 x 5)[0xaaaac6fee820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -After threads auto-tuning, 100 multiplications took 0.061788s -- effective speedup of 1.62345 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=4.47392e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.003455s; avg 0.001152s ( +/- 31.66/ 44.67 %); best 0.000787s; worst 0.001666s; std dev. 0.0003742 (taking best). +Reference operation time is 0.00078702 s (0.02541 Mflops) with 12 threads. +3 iterations (12 th.) took 0.002975s; avg 0.0009917s ( +/- 1.07/ 1.43 %); best 0.0009811s; worst 0.001006s; std dev. 1.045e-05 (taking best). +Reference operation time is 0.000981092 s (0.02039 Mflops) with 12 threads. +After 0.006485s, autotuning routine did not find a better threads count configuration. +(5 x 5)[0xaaab15d22820]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +After threads auto-tuning, 100 multiplications took 0.096535s -- effective speedup of 1.66598 x Matrix autotuning (may take more than 1.500000s; using 12 threads )... Will autotune matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=7.06911e-08), 12 suggested as starting thread count. -3 iterations (12 th.) took 0.001854s; avg 0.000618s ( +/- 3.09/ 2.12 %); best 0.0005989s; worst 0.0006311s; std dev. 1.38e-05 (taking best). -Reference operation time is 0.000598907 s (0.03339 Mflops) with 12 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.0005989 Mflops: 0.033) -Merge (2 -> 1 leaves) took w.c.t. of 1.597e-05s, ~1.907e-06s of computing time (of which 0s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 93.16/200.00 %); best 7.069e-08s; worst 3.099e-06s; std dev. 1.461e-06 (taking best). -Reference operation time is 7.06911e-08 s (282.9 Mflops) with 12 threads. -After merge step 1: tpop: 7.069e-08 s ~Mflops: 282.921 nsubm:1 otn:12 -Applying merge (2 -> 1 leaves, 12 th.) yielded SPEEDUP of 8472.175x: 0.0005989s -> 7.069e-08s, so taking this instance. +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=4.47392e-08), 12 suggested as starting thread count. +3 iterations (12 th.) took 0.002535s; avg 0.000845s ( +/- 23.54/ 25.33 %); best 0.0006461s; worst 0.001059s; std dev. 0.0001689 (taking best). +Reference operation time is 0.000646114 s (0.03095 Mflops) with 12 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.0006461 Mflops: 0.031) +Merge (2 -> 1 leaves) took w.c.t. of 1.502e-05s, ~3.099e-06s of computing time (of which 0s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 85.93/200.00 %); best 4.474e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 4.47392e-08 s (447 Mflops) with 12 threads. +After merge step 1: tpop: 4.474e-08 s ~Mflops: 447.035 nsubm:1 otn:12 +Applying merge (2 -> 1 leaves, 12 th.) yielded SPEEDUP of 14441.780x: 0.0006461s -> 4.474e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.002105s (of which 0.0002329s partitioning, 0s I/O); computing times: 1.907e-06s in par. loops, 0s sorting, 2.861e-06s analyzing) -Total merge + benchmarking process took 0.002105s, equivalent to 29777.4/3.5 new/old ops (0.003669s for 2 clones -- as 51905.6/6.1 ops, or 25952.8/3.1 ops per clone), SPEEDUP of 8472.175x -Applying multi-merge (2 -> 1 leaves, 1 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 8472.175x (0.0005989s -> 7.069e-08s), will amortize in 3.5 ops by saving 0.0005988s per op. -In 1 tuning rounds (tot. 0.0058s, 0.0037s for constructor, 2 clones) obtained a SPEEDUP of 847117.5% (8472x) (from 0.03339 to 282.9 Mflops). -After 0.005813s, autotuning routine declared speedup of 8472.18 x, when using threads count of 12. -(5 x 5)[0xaaaac6ff1de0]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' -After threads auto-tuning, 100 multiplications took 0.000014s -- further speedup of 4468.24 x +A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.001971s (of which 3.982e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.001971s, equivalent to 44050.1/3.1 new/old ops (0.004485s for 2 clones -- as 100250.5/6.9 ops, or 50125.2/3.5 ops per clone), SPEEDUP of 14441.780x +Applying multi-merge (2 -> 1 leaves, 1 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 14441.780x (0.0006461s -> 4.474e-08s), will amortize in 3.1 ops by saving 0.0006461s per op. +In 1 tuning rounds (tot. 0.0071s, 0.0045s for constructor, 2 clones) obtained a SPEEDUP of 1444078.0% (1.444e+04x) (from 0.03095 to 447 Mflops). +After 0.007119s, autotuning routine declared speedup of 14441.8 x, when using threads count of 12. +(5 x 5)[0xaaab15d25de0]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +After threads auto-tuning, 100 multiplications took 0.000014s -- further speedup of 6981 x 0/2 0 0 -> 0 1/2 1 0 -> 5 0/2 0 3 -> 0 @@ -8342,7 +8377,7 @@ Correctly initialized the library. Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0xaaaac6fee820]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0xaaab15d22820]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -8493,75 +8528,62 @@ Creating 500 x 500 matrix with 62500 nonzeroes. Building a matrix with 62500 nnz, 500 x 500 Duplicates check: 62500 - 0 = 62500 - converted COO to RSB in 1.700e-02 s (100.00 %) - analyzed arrays in 2.334e-03 s (13.73 %) - cleaned-up arrays in 3.290e-04 s (1.94 %) - deduplicated arrays in 2.248e-04 s (1.32 %) - sorted arrays in 6.590e-03 s (38.76 %) - shuffled partitions in 5.123e-03 s (30.13 %) - memory allocations took 4.101e-05 s (0.24 %) - leafs setup took 6.914e-06 s (0.04 %) - halfword conversion took 2.348e-03 s (13.81 %) -Built (500 x 500)[0xaaaae84ac2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' + converted COO to RSB in 1.381e-02 s (100.00 %) + analyzed arrays in 1.712e-03 s (12.40 %) + cleaned-up arrays in 1.311e-04 s (0.95 %) + deduplicated arrays in 1.111e-04 s (0.80 %) + sorted arrays in 7.137e-03 s (51.68 %) + shuffled partitions in 3.305e-03 s (23.93 %) + memory allocations took 3.600e-05 s (0.26 %) + leafs setup took 5.960e-06 s (0.04 %) + halfword conversion took 1.366e-03 s (9.89 %) +Built (500 x 500)[0xaaaaec55b2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' Allocated matrix of 62500 nonzeroes: -(500 x 500)[0xaaaae84ac2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' +(500 x 500)[0xaaaaec55b2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' -Before auto-tuning, 100 multiplications took 0.136075s. +Before auto-tuning, 100 multiplications took 0.129426s. Threads autotuning (may take more than 1.500000s)... Will use autotuning routine to sample matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=7.46965e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.003805s; avg 0.001268s ( +/- 22.97/ 29.15 %); best 0.000977s; worst 0.001638s; std dev. 0.0002755 (taking best). -Reference operation time is 0.000977039 s (255.9 Mflops) with 12 threads. -3 iterations (12 th.) took 0.0036s; avg 0.0012s ( +/- 16.02/ 21.17 %); best 0.001008s; worst 0.001454s; std dev. 0.0001874 (taking best). -Reference operation time is 0.0010078 s (248.1 Mflops) with 12 threads. -After 0.007491s, autotuning routine did not find a better threads count configuration. -(500 x 500)[0xaaaae84ac2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' -After threads auto-tuning, 100 multiplications took 0.110047s -- effective speedup of 1.23652 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=3.80516e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.003397s; avg 0.001132s ( +/- 50.81/ 81.92 %); best 0.0005569s; worst 0.00206s; std dev. 0.0006622 (taking best). +Reference operation time is 0.000556946 s (448.9 Mflops) with 12 threads. +3 iterations (12 th.) took 0.001898s; avg 0.0006327s ( +/- 2.63/ 1.78 %); best 0.0006161s; worst 0.000644s; std dev. 1.199e-05 (taking best). +Reference operation time is 0.000616074 s (405.8 Mflops) with 12 threads. +After 0.005369s, autotuning routine did not find a better threads count configuration. +(500 x 500)[0xaaaaec55b2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' +After threads auto-tuning, 100 multiplications took 0.146208s -- effective speedup of 0.885219 x Matrix autotuning (may take more than 1.500000s; using 12 threads )... Will autotune matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=7.46965e-08), 12 suggested as starting thread count. -3 iterations (12 th.) took 0.003247s; avg 0.001082s ( +/- 44.00/ 71.00 %); best 0.0006061s; worst 0.001851s; std dev. 0.0005486 (taking best). -Reference operation time is 0.00060606 s (412.5 Mflops) with 12 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz (tpop: 0.0006061 Mflops: 412.500) -Merge (55 -> 37 leaves) took w.c.t. of 0.0009921s, ~0.003821s of computing time (of which 0.000242s sorting, 9.06e-06s analysis) -3 iterations (12 th.) took 0.002831s; avg 0.0009437s ( +/- 27.08/ 42.52 %); best 0.0006881s; worst 0.001345s; std dev. 0.0002873 (taking best). -Reference operation time is 0.000688076 s (363.3 Mflops) with 12 threads. -After merge step 1: tpop: 0.0006881 s ~Mflops: 363.332 nsubm:37 otn:12 -Applying merge (55 -> 37 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.135x: 0.0006061s -> 0.0006881s. -Merge (37 -> 28 leaves) took w.c.t. of 0.0002849s, ~0.0001283s of computing time (of which 5.913e-05s sorting, 7.153e-06s analysis) -3 iterations (12 th.) took 0.002286s; avg 0.000762s ( +/- 20.46/ 22.31 %); best 0.0006061s; worst 0.000932s; std dev. 0.0001334 (taking best). -Reference operation time is 0.00060606 s (412.5 Mflops) with 12 threads. -After merge step 2: tpop: 0.0006061 s ~Mflops: 412.500 nsubm:28 otn:12 -Applying merge (37 -> 28 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 0.0006061s -> 0.0006061s, so IGNORING this instance. -Merge (28 -> 22 leaves) took w.c.t. of 0.0002971s, ~7.391e-05s of computing time (of which 3.791e-05s sorting, 5.007e-06s analysis) -3 iterations (12 th.) took 0.002175s; avg 0.000725s ( +/- 34.79/ 52.02 %); best 0.0004728s; worst 0.001102s; std dev. 0.0002717 (taking best). -Reference operation time is 0.000472784 s (528.8 Mflops) with 12 threads. -After merge step 3: tpop: 0.0004728 s ~Mflops: 528.783 nsubm:22 otn:12 -Applying merge (28 -> 22 leaves, 12 th.) yielded SPEEDUP of 1.282x: 0.0006061s -> 0.0004728s, so taking this instance. -Merge (22 -> 16 leaves) took w.c.t. of 0.0003641s, ~0.0001009s of computing time (of which 4.888e-05s sorting, 4.768e-06s analysis) -3 iterations (12 th.) took 0.00195s; avg 0.00065s ( +/- 17.40/ 29.55 %); best 0.0005369s; worst 0.0008421s; std dev. 0.0001365 (taking best). -Reference operation time is 0.000536919 s (465.6 Mflops) with 12 threads. -After merge step 4: tpop: 0.0005369 s ~Mflops: 465.620 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.136x: 0.0004728s -> 0.0005369s. -Merge (16 -> 10 leaves) took w.c.t. of 0.0006561s, ~0.0007989s of computing time (of which 0.000644s sorting, 5.007e-06s analysis) -3 iterations (12 th.) took 0.001577s; avg 0.0005256s ( +/- 7.56/ 14.53 %); best 0.0004859s; worst 0.000602s; std dev. 5.402e-05 (taking best). -Reference operation time is 0.000485897 s (514.5 Mflops) with 12 threads. -After merge step 5: tpop: 0.0004859 s ~Mflops: 514.512 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.028x: 0.0004728s -> 0.0004859s. -Merge (10 -> 7 leaves) took w.c.t. of 0.0001171s, ~0.0001061s of computing time (of which 4.792e-05s sorting, 4.053e-06s analysis) -3 iterations (12 th.) took 0.001565s; avg 0.0005217s ( +/- 22.35/ 13.67 %); best 0.0004051s; worst 0.0005929s; std dev. 8.312e-05 (taking best). -Reference operation time is 0.000405073 s (617.2 Mflops) with 12 threads. -After merge step 6: tpop: 0.0004051 s ~Mflops: 617.172 nsubm:7 otn:12 -Applying merge (10 -> 7 leaves, 12 th.) yielded SPEEDUP of 1.167x: 0.0004728s -> 0.0004051s, so taking this instance. -A total of 6 merge steps (of max 6) (55 -> 7 subms) took 0.01904s (of which 0.002746s partitioning, 0s I/O); computing times: 0.005029s in par. loops, 0.00108s sorting, 3.505e-05s analyzing) -Total merge + benchmarking process took 0.01904s, equivalent to 47.0/31.4 new/old ops (0.005315s for 3 clones -- as 13.1/8.8 ops, or 4.4/2.9 ops per clone), SPEEDUP of 1.496x -Applying multi-merge (55 -> 7 leaves, 6 steps, 12 -> 12 th.sp.) yielded SPEEDUP of 1.496x (0.0006061s -> 0.0004051s), will amortize in 94.7 ops by saving 0.000201s per op. -In 1 tuning rounds (tot. 0.024s, 0.0053s for constructor, 3 clones) obtained a SPEEDUP of 49.6% (1.496x) (from 412.5 to 617.2 Mflops). -After 0.024117s, autotuning routine declared speedup of 1.49617 x, when using threads count of 12. -(500 x 500)[0xaaaae85af290]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 7, symflags:'' -After threads auto-tuning, 100 multiplications took 0.062386s -- further speedup of 1.76397 x +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=3.80516e-08), 12 suggested as starting thread count. +3 iterations (12 th.) took 0.001868s; avg 0.0006227s ( +/- 8.14/ 6.48 %); best 0.000572s; worst 0.000663s; std dev. 3.789e-05 (taking best). +Reference operation time is 0.000571966 s (437.1 Mflops) with 12 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz (tpop: 0.000572 Mflops: 437.089) +Merge (55 -> 37 leaves) took w.c.t. of 0.001764s, ~0.005548s of computing time (of which 0.0004299s sorting, 7.868e-06s analysis) +3 iterations (12 th.) took 0.004421s; avg 0.001474s ( +/- 18.98/ 13.27 %); best 0.001194s; worst 0.001669s; std dev. 0.0002029 (taking best). +Reference operation time is 0.001194 s (209.4 Mflops) with 12 threads. +After merge step 1: tpop: 0.001194 s ~Mflops: 209.380 nsubm:37 otn:12 +Applying merge (55 -> 37 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 2.088x: 0.000572s -> 0.001194s. +Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 merge steps (of max 6) (55 -> 37 subms) took 0.006207s (of which 0.00177s partitioning, 0s I/O); computing times: 0.005548s in par. loops, 0.0004299s sorting, 7.868e-06s analyzing) +Total merge + benchmarking process took 0.006207s, equivalent to 10.9/10.9 new/old ops (0.001416s for 1 clones -- as 2.5/2.5 ops, or 2.5/2.5 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (12 th.) took 0.003779s; avg 0.00126s ( +/- 38.39/ 41.79 %); best 0.0007761s; worst 0.001786s; std dev. 0.0004134 (taking best). +Reference operation time is 0.000776052 s (322.1 Mflops) with 12 threads. +Starting split (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 75 subms, 55 lsubms, 2.1196 bpnz (tpop: 0.0007761 Mflops: 322.143) +Split (55 -> 136 leaves, 75 -> 183 subms) took 0.001914s (of which: 5.96e-06s analysis, -4.695e+10s mem.mgmt); compute time: 0.008213s overall, 0.0006208s searches, 0.007592s shuffle, 0.004597s switch, 9.108e-05s quadrants. +3 iterations (12 th.) took 0.004239s; avg 0.001413s ( +/- 12.89/ 22.36 %); best 0.001231s; worst 0.001729s; std dev. 0.0002243 (taking best). +Reference operation time is 0.00123096 s (203.1 Mflops) with 12 threads. +After split step 1: tpop: 0.001231 s ~Mflops: 203.094 nsubm:136 otn:12 +Applying split (55 -> 136 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.586x: 0.0007761s -> 0.001231s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 split steps (of max 6) (55 -> 136 subms) took 0.006319s (of which 0.002063s partitioning, 0s I/O); computing times: 0.008213s in par. loops, 0.0006208s sorting, 5.96e-06s analyzing) +Total split + benchmarking process took 0.006319s, equivalent to 8.1/8.1 new/old ops (0.001892s for 1 clones -- as 2.4/2.4 ops, or 2.4/2.4 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.022s, 0.0033s for constructor, 2 clones) obtained NO speedup (best stays 322.1 Mflops). +After 0.021575s, autotuning routine declared speedup of 1 x, when using threads count of 12. +(500 x 500)[0xaaaaec55b2d0]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 55, symflags:'' +After threads auto-tuning, 100 multiplications took 0.127056s -- further speedup of 1.15074 x librsb timer-based profiling is not supported in this build. If you wish to have it, re-configure librsb with its support. So you can safely ignore the error you might just have seen printed out on screen. /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve Hello, RSB! @@ -8569,19 +8591,19 @@ Correctly initialized the library. Building a matrix with 7 nnz, 6 x 6 Duplicates check: 1 - 0 = 1 - converted COO to RSB in 2.245e-03 s (100.00 %) - analyzed arrays in 1.513e-03 s (67.39 %) - cleaned-up arrays in 5.007e-06 s (0.22 %) - deduplicated arrays in 9.537e-07 s (0.04 %) - sorted arrays in 9.537e-07 s (0.04 %) - shuffled partitions in 7.000e-04 s (31.18 %) - memory allocations took 9.298e-06 s (0.41 %) - leafs setup took 5.007e-06 s (0.22 %) - halfword conversion took 9.060e-06 s (0.40 %) -Built (6 x 6)[0xaaaaf70f34d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' + converted COO to RSB in 3.947e-03 s (100.00 %) + analyzed arrays in 2.605e-03 s (66.00 %) + cleaned-up arrays in 4.053e-06 s (0.10 %) + deduplicated arrays in 1.192e-06 s (0.03 %) + sorted arrays in 9.537e-07 s (0.02 %) + shuffled partitions in 1.314e-03 s (33.29 %) + memory allocations took 7.868e-06 s (0.20 %) + leafs setup took 5.007e-06 s (0.13 %) + halfword conversion took 6.914e-06 s (0.18 %) +Built (6 x 6)[0xaaab0dc054d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0xaaaaf70f34d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0xaaab0dc054d0]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -8607,55 +8629,55 @@ 1 1 Will autotune matrix: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3.295e-08 -3 iterations (12 th.) took 2.909e-05s; avg 9.696e-06s ( +/- 99.66/200.00 %); best 3.295e-08s; worst 2.909e-05s; std dev. 1.371e-05 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 3.295e-08 Mflops: 60.699) +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3.06e-08 +3 iterations (12 th.) took 2.599e-05s; avg 8.663e-06s ( +/- 99.65/188.99 %); best 3.06e-08s; worst 2.503e-05s; std dev. 1.158e-05 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 3.06e-08 Mflops: 65.357) Merge (1 -> 1 leaves) took w.c.t. of 0s, ~0s of computing time (of which 0s sorting, 0s analysis) -3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.295e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -After merge step 1: tpop: 3.295e-08 s ~Mflops: 60.699 nsubm:1 otn:12 -Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 3.295e-08s -> 3.295e-08s, so IGNORING this instance. +3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.06e-08s; worst 0s; std dev. 0 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +After merge step 1: tpop: 3.06e-08 s ~Mflops: 65.357 nsubm:1 otn:12 +Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 3.06e-08s -> 3.06e-08s, so IGNORING this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (1 -> 1 subms) took 9.06e-06s (of which 2.146e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) -Total merge + benchmarking process took 9.06e-06s, equivalent to 275.0/275.0 new/old ops (0.001529s for 1 clones -- as 46403.8/46403.8 ops, or 46403.8/46403.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +A total of 1 merge steps (of max 6) (1 -> 1 subms) took 8.106e-06s (of which 2.146e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 8.106e-06s, equivalent to 264.9/264.9 new/old ops (0.00322s for 1 clones -- as 105227.9/105227.9 ops, or 105227.9/105227.9 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 96.55/200.00 %); best 3.295e-08s; worst 2.861e-06s; std dev. 1.349e-06 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 3.295e-08 Mflops: 60.699) -Split (1 -> 1 leaves, 1 -> 1 subms) took 1.597e-05s (of which: 1.907e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 89.63/200.00 %); best 3.295e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -After split step 1: tpop: 3.295e-08 s ~Mflops: 60.699 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 3.295e-08s -> 3.295e-08s, so IGNORING this instance. +3 iterations (12 th.) took 5.96e-06s; avg 1.987e-06s ( +/- 98.46/200.00 %); best 3.06e-08s; worst 5.96e-06s; std dev. 2.81e-06 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 3.06e-08 Mflops: 65.357) +Split (1 -> 1 leaves, 1 -> 1 subms) took 1.693e-05s (of which: 1.907e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.37/200.00 %); best 3.06e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +After split step 1: tpop: 3.06e-08 s ~Mflops: 65.357 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 3.06e-08s -> 3.06e-08s, so IGNORING this instance. Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.295e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -After split step 2: tpop: 3.295e-08 s ~Mflops: 60.699 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00000x): 3.295e-08s -> 3.295e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 2.146e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.295e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -After split step 3: tpop: 3.295e-08 s ~Mflops: 60.699 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=1.00000x): 3.295e-08s -> 3.295e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 91.71/200.00 %); best 3.295e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -After split step 4: tpop: 3.295e-08 s ~Mflops: 60.699 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00000x): 3.295e-08s -> 3.295e-08s, so IGNORING this instance. +3 iterations (12 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 92.30/200.00 %); best 3.06e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +After split step 2: tpop: 3.06e-08 s ~Mflops: 65.357 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00000x): 3.06e-08s -> 3.06e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 5.007e-06s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 95.72/ 66.67 %); best 3.06e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +After split step 3: tpop: 3.06e-08 s ~Mflops: 65.357 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=1.00000x): 3.06e-08s -> 3.06e-08s, so IGNORING this instance. Split (1 -> 1 leaves, 1 -> 1 subms) took 1.192e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.295e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -After split step 5: tpop: 3.295e-08 s ~Mflops: 60.699 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00000x): 3.295e-08s -> 3.295e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 89.63/200.00 %); best 3.295e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 3.29494e-08 s (60.7 Mflops) with 12 threads. -After split step 6: tpop: 3.295e-08 s ~Mflops: 60.699 nsubm:1 otn:12 -Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00000x): 3.295e-08s -> 3.295e-08s, so IGNORING this instance. -A total of 6 split steps (of max 6) (1 -> 1 subms) took 8.106e-05s (of which 3.815e-05s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 2.861e-06s analyzing) -Total split + benchmarking process took 8.106e-05s, equivalent to 2460.2/2460.2 new/old ops (0.001594s for 1 clones -- as 48379.2/48379.2 ops, or 48379.2/48379.2 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.0033s, 0.0031s for constructor, 2 clones) obtained NO speedup (best stays 60.7 Mflops). +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.37/200.00 %); best 3.06e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +After split step 4: tpop: 3.06e-08 s ~Mflops: 65.357 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00000x): 3.06e-08s -> 3.06e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 0s; avg 0s ( +/- -inf/ nan %); best 3.06e-08s; worst 0s; std dev. 0 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +After split step 5: tpop: 3.06e-08 s ~Mflops: 65.357 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00000x): 3.06e-08s -> 3.06e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 9.537e-07s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 90.37/200.00 %); best 3.06e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 3.0601e-08 s (65.36 Mflops) with 12 threads. +After split step 6: tpop: 3.06e-08 s ~Mflops: 65.357 nsubm:1 otn:12 +Applying split (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00000x): 3.06e-08s -> 3.06e-08s, so IGNORING this instance. +A total of 6 split steps (of max 6) (1 -> 1 subms) took 0.0002732s (of which 4.506e-05s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 2.861e-06s analyzing) +Total split + benchmarking process took 0.0002732s, equivalent to 8928.7/8928.7 new/old ops (0.002942s for 1 clones -- as 96143.4/96143.4 ops, or 96143.4/96143.4 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.0065s, 0.0062s for constructor, 2 clones) obtained NO speedup (best stays 65.36 Mflops). Backsolving we should get a unitary vector: %%MatrixMarket matrix array real general @@ -8690,119 +8712,184 @@ /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran Building a matrix with 210 nnz, 20 x 20 Duplicates check: 210 - 0 = 210 - converted COO to RSB in 7.586e-03 s (100.00 %) - analyzed arrays in 2.093e-03 s (27.59 %) - cleaned-up arrays in 2.861e-06 s (0.04 %) - deduplicated arrays in 3.099e-06 s (0.04 %) - sorted arrays in 1.306e-03 s (17.22 %) - shuffled partitions in 1.911e-03 s (25.19 %) - memory allocations took 3.409e-05 s (0.45 %) - leafs setup took 8.106e-06 s (0.11 %) - halfword conversion took 2.211e-03 s (29.14 %) -Built (20 x 20)[0xaaaae0fab9f0]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'LS' + converted COO to RSB in 8.466e-03 s (100.00 %) + analyzed arrays in 2.049e-03 s (24.21 %) + cleaned-up arrays in 2.146e-06 s (0.03 %) + deduplicated arrays in 2.146e-06 s (0.03 %) + sorted arrays in 1.429e-03 s (16.88 %) + shuffled partitions in 2.032e-03 s (24.00 %) + memory allocations took 2.670e-05 s (0.32 %) + leafs setup took 5.007e-06 s (0.06 %) + halfword conversion took 2.908e-03 s (34.35 %) +Built (20 x 20)[0xaaaade4429f0]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'LS' Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:4.134e-08 -Starting autotuning (16 x 4.13418e-08 s stages, transA=N, nrhs=1, timer gran.=4.13418e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.008901s; avg 0.002967s ( +/- 56.52/ 59.39 %); best 0.00129s; worst 0.004729s; std dev. 0.001405 (taking best). -Reference operation time is 0.00129008 s (0.6511 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.00129 Mflops: 0.651) -Merge (22 -> 16 leaves) took w.c.t. of 0.001207s, ~0.002315s of computing time (of which 3.099e-06s sorting, 5.007e-06s analysis) -3 iterations (12 th.) took 0.006034s; avg 0.002011s ( +/- 17.42/ 19.02 %); best 0.001661s; worst 0.002394s; std dev. 0.0003001 (taking best). -Reference operation time is 0.00166106 s (0.5057 Mflops) with 12 threads. -After merge step 1: tpop: 0.001661 s ~Mflops: 0.506 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.288x: 0.00129s -> 0.001661s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (22 -> 16 subms) took 0.007272s (of which 0.001218s partitioning, 0s I/O); computing times: 0.002315s in par. loops, 3.099e-06s sorting, 5.007e-06s analyzing) -Total merge + benchmarking process took 0.007272s, equivalent to 5.6/5.6 new/old ops (0.003032s for 1 clones -- as 2.4/2.4 ops, or 2.4/2.4 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3.8e-08 +Starting autotuning (16 x 3.80039e-08 s stages, transA=N, nrhs=1, timer gran.=3.80039e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 0.005578s; avg 0.001859s ( +/- 2.87/ 4.02 %); best 0.001806s; worst 0.001934s; std dev. 5.441e-05 (taking best). +Reference operation time is 0.00180602 s (0.4651 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.001806 Mflops: 0.465) +Merge (22 -> 16 leaves) took w.c.t. of 0.001031s, ~0.0007141s of computing time (of which 1.907e-06s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 0.003712s; avg 0.001237s ( +/- 35.49/ 22.10 %); best 0.0007982s; worst 0.001511s; std dev. 0.0003136 (taking best). +Reference operation time is 0.000798225 s (1.052 Mflops) with 12 threads. +After merge step 1: tpop: 0.0007982 s ~Mflops: 1.052 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 2.263x: 0.001806s -> 0.0007982s, so taking this instance. +Merge (16 -> 10 leaves) took w.c.t. of 0.0005081s, ~1.264e-05s of computing time (of which 3.099e-06s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 0.002369s; avg 0.0007896s ( +/- 31.37/ 58.70 %); best 0.0005419s; worst 0.001253s; std dev. 0.000328 (taking best). +Reference operation time is 0.000541925 s (1.55 Mflops) with 12 threads. +After merge step 2: tpop: 0.0005419 s ~Mflops: 1.550 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.473x: 0.0007982s -> 0.0005419s, so taking this instance. +Merge (10 -> 8 leaves) took w.c.t. of 1.192e-05s, ~5.007e-06s of computing time (of which 1.192e-06s sorting, 3.099e-06s analysis) +3 iterations (12 th.) took 0.00219s; avg 0.00073s ( +/- 25.50/ 38.62 %); best 0.0005438s; worst 0.001012s; std dev. 0.0002027 (taking best). +Reference operation time is 0.000543833 s (1.545 Mflops) with 12 threads. +After merge step 3: tpop: 0.0005438 s ~Mflops: 1.545 nsubm:8 otn:12 +Applying merge (10 -> 8 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99649x): 0.0005419s -> 0.0005438s, so IGNORING this instance. +Merge (8 -> 6 leaves) took w.c.t. of 5.96e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 0.001692s; avg 0.0005639s ( +/- 9.57/ 18.08 %); best 0.00051s; worst 0.0006659s; std dev. 7.214e-05 (taking best). +Reference operation time is 0.000509977 s (1.647 Mflops) with 12 threads. +After merge step 4: tpop: 0.00051 s ~Mflops: 1.647 nsubm:6 otn:12 +Applying merge (8 -> 6 leaves, 12 th.) yielded SPEEDUP of 1.063x: 0.0005419s -> 0.00051s, so taking this instance. +Merge (6 -> 3 leaves) took w.c.t. of 7.868e-06s, ~3.099e-06s of computing time (of which 2.146e-06s sorting, 0s analysis) +3 iterations (12 th.) took 0.001658s; avg 0.0005527s ( +/- 7.35/ 13.10 %); best 0.0005121s; worst 0.0006251s; std dev. 5.132e-05 (taking best). +Reference operation time is 0.000512123 s (1.64 Mflops) with 12 threads. +After merge step 5: tpop: 0.0005121 s ~Mflops: 1.640 nsubm:3 otn:12 +Applying merge (6 -> 3 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99581x): 0.00051s -> 0.0005121s, so IGNORING this instance. +Merge (3 -> 1 leaves) took w.c.t. of 7.153e-06s, ~3.815e-06s of computing time (of which 1.907e-06s sorting, 1.192e-06s analysis) +3 iterations (12 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 96.32/ 84.62 %); best 3.8e-08s; worst 1.907e-06s; std dev. 7.867e-07 (taking best). +Reference operation time is 3.80039e-08 s (2.21e+04 Mflops) with 12 threads. +After merge step 6: tpop: 3.8e-08 s ~Mflops: 22102.982 nsubm:1 otn:12 +Applying merge (3 -> 1 leaves, 12 th.) yielded SPEEDUP of 13419.072x: 0.00051s -> 3.8e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 6 merge steps (of max 6) (22 -> 1 subms) took 0.0216s (of which 0.001588s partitioning, 0s I/O); computing times: 0.0007405s in par. loops, 1.121e-05s sorting, 1.431e-05s analyzing) +Total merge + benchmarking process took 0.0216s, equivalent to 568230.9/12.0 new/old ops (0.01246s for 5 clones -- as 327885.8/6.9 ops, or 65577.2/1.4 ops per clone), SPEEDUP of 47521.957x +Applying multi-merge (22 -> 1 leaves, 6 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 47521.957x (0.001806s -> 3.8e-08s), will amortize in 12.0 ops by saving 0.001806s per op. +In 1 tuning rounds (tot. 0.031s, 0.012s for constructor, 5 clones) obtained a SPEEDUP of 4752095.7% (4.752e+04x) (from 0.4651 to 2.21e+04 Mflops). + autotuner chose 12 threads +Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz. +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3.8e-08 +Starting autotuning (16 x 3.80039e-08 s stages, transA=N, nrhs=1, timer gran.=3.80039e-08), 12 suggested as starting thread count(default). +3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 96.02/100.00 %); best 3.8e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). +~ 12 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 11 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 10 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 9 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.02/ 50.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 8 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 7 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.44/200.00 %); best 3.8e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 6 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 5 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 4 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 3 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.44/200.00 %); best 3.8e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 2 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 1 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 5.1e-05s. +Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz (tpop: 3.8e-08 Mflops: 22102.982) +Merge (1 -> 1 leaves) took w.c.t. of 0s, ~0s of computing time (of which 0s sorting, 0s analysis) +3 iterations (12 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +~ 12 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 94.69/ 66.67 %); best 3.8e-08s; worst 1.192e-06s; std dev. 5.15e-07 (taking best). + 11 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 10 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 9 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.02/ 50.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 8 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 7 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.44/200.00 %); best 3.8e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 6 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.02/ 50.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 5 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 4 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.44/200.00 %); best 3.8e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 3 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.02/ 50.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 2 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 1 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 4.9e-05s. +After merge step 1: tpop: 3.8e-08 s ~Mflops: 22102.982 nsubm:1 otn:12 +Applying merge (1 -> 1 leaves, 12 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 3.8e-08s -> 3.8e-08s, so IGNORING this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 1 merge steps (of max 6) (1 -> 1 subms) took 5.507e-05s (of which 1.192e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 5.507e-05s, equivalent to 1449.2/1449.2 new/old ops (0.001548s for 1 clones -- as 40734.0/40734.0 ops, or 40734.0/40734.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (12 th.) took 0.01307s; avg 0.004358s ( +/- 68.91/ 50.61 %); best 0.001355s; worst 0.006563s; std dev. 0.0022 (taking best). -Reference operation time is 0.00135493 s (0.62 Mflops) with 12 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.001355 Mflops: 0.620) -Split (22 -> 51 leaves, 30 -> 70 subms) took 0.001385s (of which: 4.053e-06s analysis, -1.951e+10s mem.mgmt); compute time: 0.006516s overall, 6.437e-06s searches, 0.006509s shuffle, 0.00593s switch, 0.000113s quadrants. -3 iterations (12 th.) took 0.01345s; avg 0.004485s ( +/- 55.92/100.19 %); best 0.001977s; worst 0.008978s; std dev. 0.003184 (taking best). -Reference operation time is 0.00197697 s (0.4249 Mflops) with 12 threads. -After split step 1: tpop: 0.001977 s ~Mflops: 0.425 nsubm:51 otn:12 -Applying split (22 -> 51 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.459x: 0.001355s -> 0.001977s. +3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 96.02/100.00 %); best 3.8e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). +~ 12 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.44/200.00 %); best 3.8e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 11 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 10 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (9 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.02/ 50.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 9 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 8 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.44/200.00 %); best 3.8e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 7 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 94.02/ 50.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 6 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 5 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 4 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 1.192e-06s; avg 3.974e-07s ( +/- 90.44/200.00 %); best 3.8e-08s; worst 1.192e-06s; std dev. 5.62e-07 (taking best). + 3 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 2 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 88.05/200.00 %); best 3.8e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). + 1 threads: 3.8e-08s (2.2e+04 Mflops) (0/2 degradations so far) - +Best threads choice is 12; starting threads were 12; max speed gap is 1x; search took 5.5e-05s. +Starting split (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 1 subms, 1 lsubms, 2.4000 bpnz (tpop: 3.8e-08 Mflops: 22102.982) +Split (1 -> 3 leaves, 1 -> 4 subms) took 2.408e-05s (of which: 1.907e-06s analysis, -1.739e+09s mem.mgmt); compute time: 8.821e-06s overall, 2.146e-06s searches, 6.676e-06s shuffle, 2.861e-06s switch, 0s quadrants. +3 iterations (12 th.) took 0.003048s; avg 0.001016s ( +/- 24.02/ 31.19 %); best 0.000772s; worst 0.001333s; std dev. 0.0002348 (taking best). +~ 12 threads: 0.000772s (1.1 Mflops) (0/2 degradations so far) - +3 iterations (11 th.) took 0.00226s; avg 0.0007533s ( +/- 9.86/ 19.60 %); best 0.000679s; worst 0.000901s; std dev. 0.0001044 (taking best). + 11 threads: 0.000679s (1.2 Mflops) (0/2 degradations so far) - +3 iterations (10 th.) took 0.004276s; avg 0.001425s ( +/- 39.16/ 20.03 %); best 0.0008671s; worst 0.001711s; std dev. 0.0003948 (taking best). + 10 threads: 0.0008671s (0.97 Mflops) (1/2 degradations so far) - +3 iterations (9 th.) took 0.00399s; avg 0.00133s ( +/- 31.51/ 43.91 %); best 0.000911s; worst 0.001914s; std dev. 0.0004258 (taking best). + 9 threads: 0.000911s (0.92 Mflops) (2/2 degradations so far) - +Best threads choice is 11; starting threads were 12; max speed gap is 1.3x; search took 0.014s. +After split step 1: tpop: 0.000679 s ~Mflops: 1.237 nsubm:3 otn:11 +Applying split (1 -> 3 leaves, 11 th.) yielded SLOWDOWN (1th of 3 tolerable) of 17867.001x: 3.8e-08s -> 0.000679s. Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 split steps (of max 6) (22 -> 51 subms) took 0.01493s (of which 0.001456s partitioning, 0s I/O); computing times: 0.006516s in par. loops, 6.437e-06s sorting, 4.053e-06s analyzing) -Total split + benchmarking process took 0.01493s, equivalent to 11.0/11.0 new/old ops (0.003503s for 1 clones -- as 2.6/2.6 ops, or 2.6/2.6 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.051s, 0.0065s for constructor, 2 clones) obtained NO speedup (best stays 0.62 Mflops). - autotuner chose 12 threads -Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:4.134e-08 -Starting autotuning (16 x 4.13418e-08 s stages, transA=N, nrhs=1, timer gran.=4.13418e-08), 12 suggested as starting thread count(default). -3 iterations (12 th.) took 0.003517s; avg 0.001172s ( +/- 40.56/ 79.30 %); best 0.0006969s; worst 0.002102s; std dev. 0.0006575 (taking best). -~ 12 threads: 0.0006969s (1.2 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.002576s; avg 0.0008587s ( +/- 41.64/ 27.86 %); best 0.0005012s; worst 0.001098s; std dev. 0.0002576 (taking best). - 11 threads: 0.0005012s (1.7 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.003805s; avg 0.001268s ( +/- 35.03/ 39.88 %); best 0.000824s; worst 0.001774s; std dev. 0.0003903 (taking best). - 10 threads: 0.000824s (1 Mflops) (1/2 degradations so far) - -3 iterations (9 th.) took 0.007632s; avg 0.002544s ( +/- 77.55/ 97.72 %); best 0.000571s; worst 0.00503s; std dev. 0.001856 (taking best). - 9 threads: 0.000571s (1.5 Mflops) (2/2 degradations so far) - -Best threads choice is 11; starting threads were 12; max speed gap is 1.6x; search took 0.018s. -Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 30 subms, 22 lsubms, 3.7524 bpnz (tpop: 0.0005012 Mflops: 1.676) -Merge (22 -> 16 leaves) took w.c.t. of 0.0003519s, ~1.287e-05s of computing time (of which 1.907e-06s sorting, 5.007e-06s analysis) -3 iterations (12 th.) took 0.004325s; avg 0.001442s ( +/- 28.90/ 33.59 %); best 0.001025s; worst 0.001926s; std dev. 0.0003709 (taking best). -~ 12 threads: 0.001025s (0.82 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.002726s; avg 0.0009087s ( +/- 27.35/ 21.16 %); best 0.0006602s; worst 0.001101s; std dev. 0.0001843 (taking best). - 11 threads: 0.0006602s (1.3 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.00376s; avg 0.001253s ( +/- 57.87/ 36.35 %); best 0.0005281s; worst 0.001709s; std dev. 0.0005184 (taking best). - 10 threads: 0.0005281s (1.6 Mflops) (0/2 degradations so far) - -3 iterations (9 th.) took 0.005544s; avg 0.001848s ( +/- 71.91/ 68.62 %); best 0.000519s; worst 0.003116s; std dev. 0.001061 (taking best). - 9 threads: 0.000519s (1.6 Mflops) (0/2 degradations so far) - -3 iterations (8 th.) took 0.003409s; avg 0.001136s ( +/- 19.47/ 26.81 %); best 0.0009151s; worst 0.001441s; std dev. 0.0002227 (taking best). - 8 threads: 0.0009151s (0.92 Mflops) (1/2 degradations so far) - -3 iterations (7 th.) took 0.001562s; avg 0.0005206s ( +/- 33.51/ 27.13 %); best 0.0003462s; worst 0.0006618s; std dev. 0.000131 (taking best). - 7 threads: 0.0003462s (2.4 Mflops) (0/2 degradations so far) - -3 iterations (6 th.) took 0.004438s; avg 0.001479s ( +/- 62.14/ 71.89 %); best 0.00056s; worst 0.002543s; std dev. 0.0008159 (taking best). - 6 threads: 0.00056s (1.5 Mflops) (1/2 degradations so far) - -3 iterations (5 th.) took 0.002313s; avg 0.000771s ( +/- 34.10/ 34.24 %); best 0.0005081s; worst 0.001035s; std dev. 0.0002151 (taking best). - 5 threads: 0.0005081s (1.7 Mflops) (2/2 degradations so far) - -Best threads choice is 7; starting threads were 12; max speed gap is 3x; search took 0.028s. -After merge step 1: tpop: 0.0003462 s ~Mflops: 2.426 nsubm:16 otn:7 -Applying merge (22 -> 16 leaves, 7 th.) yielded SPEEDUP of 1.448x: 0.0005012s -> 0.0003462s, so taking this instance. -Merge (16 -> 10 leaves) took w.c.t. of 0.000277s, ~1.287e-05s of computing time (of which 1.907e-06s sorting, 3.815e-06s analysis) -3 iterations (12 th.) took 0.006041s; avg 0.002014s ( +/- 66.67/122.38 %); best 0.0006711s; worst 0.004478s; std dev. 0.001745 (taking best). -~ 12 threads: 0.0006711s (1.3 Mflops) (0/2 degradations so far) - -3 iterations (11 th.) took 0.001901s; avg 0.0006337s ( +/- 25.36/ 48.65 %); best 0.000473s; worst 0.000942s; std dev. 0.000218 (taking best). - 11 threads: 0.000473s (1.8 Mflops) (0/2 degradations so far) - -3 iterations (10 th.) took 0.001627s; avg 0.0005423s ( +/- 17.57/ 23.71 %); best 0.000447s; worst 0.0006709s; std dev. 9.438e-05 (taking best). - 10 threads: 0.000447s (1.9 Mflops) (0/2 degradations so far) - -3 iterations (9 th.) took 0.001511s; avg 0.0005036s ( +/- 0.54/ 0.46 %); best 0.0005009s; worst 0.0005059s; std dev. 2.063e-06 (taking best). - 9 threads: 0.0005009s (1.7 Mflops) (1/2 degradations so far) - -3 iterations (8 th.) took 0.00189s; avg 0.00063s ( +/- 20.94/ 39.35 %); best 0.0004981s; worst 0.0008779s; std dev. 0.0001754 (taking best). - 8 threads: 0.0004981s (1.7 Mflops) (2/2 degradations so far) - -Best threads choice is 10; starting threads were 12; max speed gap is 1.5x; search took 0.013s. -After merge step 2: tpop: 0.000447 s ~Mflops: 1.879 nsubm:10 otn:10 -Applying merge (16 -> 10 leaves, 10 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.291x: 0.0003462s -> 0.000447s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 merge steps (of max 6) (22 -> 10 subms) took 0.04357s (of which 0.0006402s partitioning, 0s I/O); computing times: 2.575e-05s in par. loops, 3.815e-06s sorting, 8.821e-06s analyzing) -Total merge + benchmarking process took 0.04357s, equivalent to 125.8/86.9 new/old ops (0.003694s for 2 clones -- as 10.7/7.4 ops, or 5.3/3.7 ops per clone), SPEEDUP of 1.448x -Applying multi-merge (22 -> 16 leaves, 1 steps, 11 -> 7 th.sp.) yielded SPEEDUP of 1.448x (0.0005012s -> 0.0003462s), will amortize in 281.1 ops by saving 0.000155s per op. -In 1 tuning rounds (tot. 0.063s, 0.0037s for constructor, 2 clones) obtained a SPEEDUP of 44.8% (1.448x) (from 1.676 to 2.426 Mflops). +A total of 1 split steps (of max 6) (1 -> 3 subms) took 0.01364s (of which 3.099e-05s partitioning, 0s I/O); computing times: 8.821e-06s in par. loops, 2.146e-06s sorting, 1.907e-06s analyzing) +Total split + benchmarking process took 0.01364s, equivalent to 358808.0/358808.0 new/old ops (0.001512s for 1 clones -- as 39780.4/39780.4 ops, or 39780.4/39780.4 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.017s, 0.0031s for constructor, 2 clones) obtained NO speedup (best stays 2.21e+04 Mflops). check results are ok Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 1.809e-03 s (100.00 %) - analyzed arrays in 8.891e-04 s (49.14 %) - cleaned-up arrays in 9.537e-07 s (0.05 %) - deduplicated arrays in 9.537e-07 s (0.05 %) - sorted arrays in 3.500e-04 s (19.35 %) - shuffled partitions in 5.610e-04 s (31.01 %) - memory allocations took 4.053e-06 s (0.22 %) - leafs setup took 9.537e-07 s (0.05 %) - halfword conversion took 1.192e-06 s (0.07 %) -Built (6 x 6)[0xaaaae0faa590]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' + converted COO to RSB in 2.679e-03 s (100.00 %) + analyzed arrays in 9.100e-04 s (33.97 %) + cleaned-up arrays in 9.537e-07 s (0.04 %) + deduplicated arrays in 0.000e+00 s (0.00 %) + sorted arrays in 8.910e-04 s (33.26 %) + shuffled partitions in 8.700e-04 s (32.47 %) + memory allocations took 3.099e-06 s (0.12 %) + leafs setup took 2.146e-06 s (0.08 %) + halfword conversion took 9.537e-07 s (0.04 %) +Built (6 x 6)[0xaaaade44e0a0]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' Read matrix pd.mtx 6 x 6 : 36 Matrix has no symmetry Using NRHS=4 -Repeated USMV took 0.1938E-03 s +Repeated USMV took 0.1881E-03 s A single USMM took 0.5007E-05 s -USMM-to-USMV speed ratio is is 38.71 x +USMM-to-USMV speed ratio is is 37.57 x Call auto-tuning routine.. Repeat measurement. -Tuned USMM took 0.1907E-05 s -Tuned-to-untuned speed ratio is is 2.625 x +Tuned USMM took 0.9537E-06 s +Tuned-to-untuned speed ratio is is 5.250 x FAILED: 0 PASSED: 2 /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran_rsb_fi @@ -8851,228 +8938,223 @@ Loading matrix from file "/build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx". Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 6.818e-03 s (100.00 %) - analyzed arrays in 2.655e-03 s (38.94 %) - cleaned-up arrays in 5.960e-06 s (0.09 %) - deduplicated arrays in 9.537e-07 s (0.01 %) - sorted arrays in 9.930e-04 s (14.56 %) - shuffled partitions in 1.617e-03 s (23.72 %) - memory allocations took 1.407e-05 s (0.21 %) - leafs setup took 4.053e-06 s (0.06 %) - halfword conversion took 1.513e-03 s (22.19 %) -Built (6 x 6)[0xaaaadf828a20]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + converted COO to RSB in 7.334e-03 s (100.00 %) + analyzed arrays in 1.738e-03 s (23.70 %) + cleaned-up arrays in 5.960e-06 s (0.08 %) + deduplicated arrays in 1.192e-06 s (0.02 %) + sorted arrays in 1.584e-03 s (21.60 %) + shuffled partitions in 1.254e-03 s (17.10 %) + memory allocations took 9.775e-06 s (0.13 %) + leafs setup took 5.960e-06 s (0.08 %) + halfword conversion took 2.724e-03 s (37.14 %) +Built (6 x 6)[0xaaaadcb5da20]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Considering D clone. Base matrix: -(6 x 6)[0xaaaadf82caa0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(6 x 6)[0xaaaadcb61aa0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003867s; avg 0.001289s ( +/- 17.62/ 28.55 %); best 0.001062s; worst 0.001657s; std dev. 0.0002626 (taking best). -Reference operation time is 0.00106192 s (0.1356 Mflops) with 12 threads. -After 0.003915s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.01088s; avg 0.003625s ( +/- 47.62/ 38.88 %); best 0.001899s; worst 0.005035s; std dev. 0.0013 (taking best). +Reference operation time is 0.001899 s (0.07583 Mflops) with 12 threads. +After 0.010932s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003802s; avg 0.001267s ( +/- 6.35/ 11.50 %); best 0.001187s; worst 0.001413s; std dev. 0.0001033 (taking best). -Reference operation time is 0.00118685 s (0.1213 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.001187 Mflops: 0.121) -Merge (22 -> 16 leaves) took w.c.t. of 0.001051s, ~0.0006301s of computing time (of which 2.146e-06s sorting, 5.96e-06s analysis) -3 iterations (12 th.) took 0.004831s; avg 0.00161s ( +/- 15.24/ 26.24 %); best 0.001365s; worst 0.002033s; std dev. 0.0003001 (taking best). -Reference operation time is 0.00136495 s (0.1055 Mflops) with 12 threads. -After merge step 1: tpop: 0.001365 s ~Mflops: 0.105 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.150x: 0.001187s -> 0.001365s. -Merge (16 -> 10 leaves) took w.c.t. of 0.000108s, ~1.621e-05s of computing time (of which 3.338e-06s sorting, 4.053e-06s analysis) -3 iterations (12 th.) took 0.02216s; avg 0.007388s ( +/- 82.90/142.32 %); best 0.001263s; worst 0.0179s; std dev. 0.007469 (taking best). -Reference operation time is 0.00126314 s (0.114 Mflops) with 12 threads. -After merge step 2: tpop: 0.001263 s ~Mflops: 0.114 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.064x: 0.001187s -> 0.001263s. -Merge (10 -> 7 leaves) took w.c.t. of 2.217e-05s, ~5.96e-06s of computing time (of which 1.192e-06s sorting, 6.914e-06s analysis) -3 iterations (12 th.) took 0.003514s; avg 0.001171s ( +/- 2.42/ 4.66 %); best 0.001143s; worst 0.001226s; std dev. 3.862e-05 (taking best). -Reference operation time is 0.00114298 s (0.126 Mflops) with 12 threads. -After merge step 3: tpop: 0.001143 s ~Mflops: 0.126 nsubm:7 otn:12 -Applying merge (10 -> 7 leaves, 12 th.) yielded SPEEDUP of 1.038x: 0.001187s -> 0.001143s, so taking this instance. -Merge (7 -> 4 leaves) took w.c.t. of 2.098e-05s, ~3.099e-06s of computing time (of which 0s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 0.003464s; avg 0.001155s ( +/- 9.06/ 7.31 %); best 0.00105s; worst 0.001239s; std dev. 7.85e-05 (taking best). -Reference operation time is 0.00105 s (0.1371 Mflops) with 12 threads. -After merge step 4: tpop: 0.00105 s ~Mflops: 0.137 nsubm:4 otn:12 -Applying merge (7 -> 4 leaves, 12 th.) yielded SPEEDUP of 1.089x: 0.001143s -> 0.00105s, so taking this instance. -Merge (4 -> 1 leaves) took w.c.t. of 1.001e-05s, ~4.053e-06s of computing time (of which 1.907e-06s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 96.75/111.76 %); best 4.386e-08s; worst 2.861e-06s; std dev. 1.173e-06 (taking best). -Reference operation time is 4.38571e-08 s (3283 Mflops) with 12 threads. -After merge step 5: tpop: 4.386e-08 s ~Mflops: 3283.391 nsubm:1 otn:12 -Applying merge (4 -> 1 leaves, 12 th.) yielded SPEEDUP of 23941.288x: 0.00105s -> 4.386e-08s, so taking this instance. -Merged all the matrix leaves: no reason to continue merging. -A total of 5 merge steps (of max 6) (22 -> 1 subms) took 0.04487s (of which 0.00125s partitioning, 0s I/O); computing times: 0.0006595s in par. loops, 8.583e-06s sorting, 2.003e-05s analyzing) -Total merge + benchmarking process took 0.04487s, equivalent to 1023120.4/37.8 new/old ops (0.01257s for 4 clones -- as 286637.7/10.6 ops, or 71659.4/2.6 ops per clone), SPEEDUP of 27061.702x -Applying multi-merge (22 -> 1 leaves, 5 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 27061.702x (0.001187s -> 4.386e-08s), will amortize in 37.8 ops by saving 0.001187s per op. -In 1 tuning rounds (tot. 0.052s, 0.013s for constructor, 4 clones) obtained a SPEEDUP of 2706070.2% (2.706e+04x) (from 0.1213 to 3283 Mflops). -After 0.051742s, global autotuning declared speedup of 27061.7 x, when using threads count of 12 and a new matrix: -(6 x 6)[0xaaaadf82ee70]{D} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' +3 iterations (12 th.) took 0.004501s; avg 0.0015s ( +/- 18.88/ 21.17 %); best 0.001217s; worst 0.001818s; std dev. 0.0002465 (taking best). +Reference operation time is 0.00121713 s (0.1183 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.001217 Mflops: 0.118) +Merge (22 -> 16 leaves) took w.c.t. of 0.0008502s, ~0.0008657s of computing time (of which 1.907e-06s sorting, 6.199e-06s analysis) +3 iterations (12 th.) took 0.01638s; avg 0.00546s ( +/- 78.28/143.47 %); best 0.001186s; worst 0.01329s; std dev. 0.005547 (taking best). +Reference operation time is 0.00118589 s (0.1214 Mflops) with 12 threads. +After merge step 1: tpop: 0.001186 s ~Mflops: 0.121 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.026x: 0.001217s -> 0.001186s, so taking this instance. +Merge (16 -> 10 leaves) took w.c.t. of 0.00021s, ~1.717e-05s of computing time (of which 1.907e-06s sorting, 3.815e-06s analysis) +3 iterations (12 th.) took 0.003275s; avg 0.001092s ( +/- 30.57/ 28.53 %); best 0.0007579s; worst 0.001403s; std dev. 0.0002639 (taking best). +Reference operation time is 0.000757933 s (0.19 Mflops) with 12 threads. +After merge step 2: tpop: 0.0007579 s ~Mflops: 0.190 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.565x: 0.001186s -> 0.0007579s, so taking this instance. +Merge (10 -> 7 leaves) took w.c.t. of 1.383e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 0.002836s; avg 0.0009453s ( +/- 17.70/ 34.65 %); best 0.000778s; worst 0.001273s; std dev. 0.0002317 (taking best). +Reference operation time is 0.00077796 s (0.1851 Mflops) with 12 threads. +After merge step 3: tpop: 0.000778 s ~Mflops: 0.185 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.026x: 0.0007579s -> 0.000778s. +Merge (7 -> 4 leaves) took w.c.t. of 5.96e-06s, ~1.907e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) +3 iterations (12 th.) took 0.004084s; avg 0.001361s ( +/- 28.52/ 56.10 %); best 0.000973s; worst 0.002125s; std dev. 0.0005401 (taking best). +Reference operation time is 0.000972986 s (0.148 Mflops) with 12 threads. +After merge step 4: tpop: 0.000973 s ~Mflops: 0.148 nsubm:4 otn:12 +Applying merge (7 -> 4 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.284x: 0.0007579s -> 0.000973s. +Skipping further merge based tests after 2 definite performance degradations in a row (and last exceeding limit). +A total of 4 merge steps (of max 6) (22 -> 4 subms) took 0.03581s (of which 0.0011s partitioning, 0s I/O); computing times: 0.0008888s in par. loops, 4.768e-06s sorting, 1.597e-05s analyzing) +Total merge + benchmarking process took 0.03581s, equivalent to 47.2/29.4 new/old ops (0.01102s for 3 clones -- as 14.5/9.1 ops, or 4.8/3.0 ops per clone), SPEEDUP of 1.606x +Applying multi-merge (22 -> 10 leaves, 2 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.606x (0.001217s -> 0.0007579s), will amortize in 78.0 ops by saving 0.0004592s per op. +In 1 tuning rounds (tot. 0.043s, 0.011s for constructor, 3 clones) obtained a SPEEDUP of 60.6% (1.606x) (from 0.1183 to 0.19 Mflops). +After 0.043362s, global autotuning declared speedup of 1.60585 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaaadcb67ab0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 10, symflags:'' Considering S clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 6.329e-03 s (100.00 %) - analyzed arrays in 2.399e-03 s (37.91 %) - cleaned-up arrays in 9.537e-07 s (0.02 %) - deduplicated arrays in 9.537e-07 s (0.02 %) + converted COO to RSB in 7.222e-03 s (100.00 %) + analyzed arrays in 2.747e-03 s (38.04 %) + cleaned-up arrays in 1.192e-06 s (0.02 %) + deduplicated arrays in 0.000e+00 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.969e-03 s (31.11 %) - memory allocations took 1.907e-06 s (0.03 %) - leafs setup took 9.537e-07 s (0.02 %) - halfword conversion took 1.955e-03 s (30.89 %) -Built (6 x 6)[0xaaaadf82ee70]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + shuffled partitions in 2.589e-03 s (35.85 %) + memory allocations took 4.768e-06 s (0.07 %) + leafs setup took 3.099e-06 s (0.04 %) + halfword conversion took 1.876e-03 s (25.97 %) +Built (6 x 6)[0xaaaadcb61aa0]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Base matrix: -(6 x 6)[0xaaaadf82ee70]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(6 x 6)[0xaaaadcb61aa0]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' -Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. +Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.00306s; avg 0.00102s ( +/- 19.31/ 27.15 %); best 0.000823s; worst 0.001297s; std dev. 0.0002016 (taking best). -Reference operation time is 0.000823021 s (0.175 Mflops) with 12 threads. -After 0.003083s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.01963s; avg 0.006543s ( +/- 61.68/ 88.30 %); best 0.002507s; worst 0.01232s; std dev. 0.004191 (taking best). +Reference operation time is 0.00250721 s (0.05743 Mflops) with 12 threads. +After 0.019658s, autotuning routine did not find a better threads count configuration. -Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. +Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.002751s; avg 0.000917s ( +/- 0.53/ 0.54 %); best 0.0009122s; worst 0.000922s; std dev. 3.991e-06 (taking best). -Reference operation time is 0.000912189 s (0.1579 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.0009122 Mflops: 0.158) -Merge (16 -> 10 leaves) took w.c.t. of 0.000474s, ~8.106e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 0.002965s; avg 0.0009883s ( +/- 15.30/ 24.55 %); best 0.0008371s; worst 0.001231s; std dev. 0.0001733 (taking best). -Reference operation time is 0.000837088 s (0.172 Mflops) with 12 threads. -After merge step 1: tpop: 0.0008371 s ~Mflops: 0.172 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.090x: 0.0009122s -> 0.0008371s, so taking this instance. -Merge (10 -> 7 leaves) took w.c.t. of 1.216e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 3.099e-06s analysis) -3 iterations (12 th.) took 0.002623s; avg 0.0008744s ( +/- 9.88/ 16.90 %); best 0.000788s; worst 0.001022s; std dev. 0.000105 (taking best). -Reference operation time is 0.000787973 s (0.1827 Mflops) with 12 threads. -After merge step 2: tpop: 0.000788 s ~Mflops: 0.183 nsubm:7 otn:12 -Applying merge (10 -> 7 leaves, 12 th.) yielded SPEEDUP of 1.062x: 0.0008371s -> 0.000788s, so taking this instance. -Merge (7 -> 4 leaves) took w.c.t. of 5.96e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) -3 iterations (12 th.) took 0.002297s; avg 0.0007656s ( +/- 4.25/ 5.13 %); best 0.0007331s; worst 0.0008049s; std dev. 2.968e-05 (taking best). -Reference operation time is 0.000733137 s (0.1964 Mflops) with 12 threads. -After merge step 3: tpop: 0.0007331 s ~Mflops: 0.196 nsubm:4 otn:12 -Applying merge (7 -> 4 leaves, 12 th.) yielded SPEEDUP of 1.075x: 0.000788s -> 0.0007331s, so taking this instance. -Merge (4 -> 1 leaves) took w.c.t. of 5.007e-06s, ~2.146e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (12 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 93.10/200.00 %); best 4.386e-08s; worst 1.907e-06s; std dev. 8.991e-07 (taking best). -Reference operation time is 4.38571e-08 s (3283 Mflops) with 12 threads. -After merge step 4: tpop: 4.386e-08 s ~Mflops: 3283.391 nsubm:1 otn:12 -Applying merge (4 -> 1 leaves, 12 th.) yielded SPEEDUP of 16716.499x: 0.0007331s -> 4.386e-08s, so taking this instance. -Merged all the matrix leaves: no reason to continue merging. -A total of 4 merge steps (of max 6) (16 -> 1 subms) took 0.01793s (of which 0.0005291s partitioning, 0s I/O); computing times: 1.621e-05s in par. loops, 3.815e-06s sorting, 8.345e-06s analyzing) -Total merge + benchmarking process took 0.01793s, equivalent to 408920.9/19.7 new/old ops (0.01242s for 5 clones -- as 283125.8/13.6 ops, or 56625.2/2.7 ops per clone), SPEEDUP of 20799.130x -Applying multi-merge (16 -> 1 leaves, 4 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 20799.130x (0.0009122s -> 4.386e-08s), will amortize in 19.7 ops by saving 0.0009121s per op. -In 1 tuning rounds (tot. 0.024s, 0.012s for constructor, 5 clones) obtained a SPEEDUP of 2079813.0% (2.08e+04x) (from 0.1579 to 3283 Mflops). -After 0.023682s, global autotuning declared speedup of 20799.1 x, when using threads count of 12 and a new matrix: -(6 x 6)[0xaaaadf82e310]{S} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' +3 iterations (12 th.) took 0.004569s; avg 0.001523s ( +/- 27.83/ 33.22 %); best 0.001099s; worst 0.002029s; std dev. 0.000384 (taking best). +Reference operation time is 0.00109911 s (0.131 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz (tpop: 0.001099 Mflops: 0.131) +Merge (16 -> 13 leaves) took w.c.t. of 1.597e-05s, ~5.007e-06s of computing time (of which 2.146e-06s sorting, 3.815e-06s analysis) +3 iterations (12 th.) took 0.00894s; avg 0.00298s ( +/- 47.48/ 81.58 %); best 0.001565s; worst 0.005411s; std dev. 0.001727 (taking best). +Reference operation time is 0.00156498 s (0.09201 Mflops) with 12 threads. +After merge step 1: tpop: 0.001565 s ~Mflops: 0.092 nsubm:13 otn:12 +Applying merge (16 -> 13 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.424x: 0.001099s -> 0.001565s. +Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 merge steps (of max 6) (16 -> 13 subms) took 0.008983s (of which 1.979e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 2.146e-06s sorting, 3.815e-06s analyzing) +Total merge + benchmarking process took 0.008983s, equivalent to 8.2/8.2 new/old ops (0.003182s for 1 clones -- as 2.9/2.9 ops, or 2.9/2.9 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (12 th.) took 0.003457s; avg 0.001152s ( +/- 19.72/ 31.38 %); best 0.0009251s; worst 0.001514s; std dev. 0.0002585 (taking best). +Reference operation time is 0.000925064 s (0.1557 Mflops) with 12 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.5000 bpnz (tpop: 0.0009251 Mflops: 0.156) +Split (16 -> 25 leaves, 21 -> 33 subms) took 0.000535s (of which: 3.099e-06s analysis, -5.217e+09s mem.mgmt); compute time: 2.313e-05s overall, 1.907e-06s searches, 2.122e-05s shuffle, 5.96e-06s switch, 0s quadrants. +3 iterations (12 th.) took 0.01108s; avg 0.003694s ( +/- 68.22/ 66.91 %); best 0.001174s; worst 0.006166s; std dev. 0.002038 (taking best). +Reference operation time is 0.00117397 s (0.1227 Mflops) with 12 threads. +After split step 1: tpop: 0.001174 s ~Mflops: 0.123 nsubm:25 otn:12 +Applying split (16 -> 25 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.269x: 0.0009251s -> 0.001174s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 split steps (of max 6) (16 -> 25 subms) took 0.01168s (of which 0.0005798s partitioning, 0s I/O); computing times: 2.313e-05s in par. loops, 1.907e-06s sorting, 3.099e-06s analyzing) +Total split + benchmarking process took 0.01168s, equivalent to 12.6/12.6 new/old ops (0.005706s for 1 clones -- as 6.2/6.2 ops, or 6.2/6.2 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.038s, 0.0089s for constructor, 2 clones) obtained NO speedup (best stays 0.1557 Mflops). +After 0.037688s, global autotuning found old matrix optimal, with declared speedup 1 x when using 12 threads Considering C clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 4.838e-03 s (100.00 %) - analyzed arrays in 1.969e-03 s (40.70 %) + converted COO to RSB in 7.278e-03 s (100.00 %) + analyzed arrays in 4.629e-03 s (63.60 %) cleaned-up arrays in 1.192e-06 s (0.02 %) - deduplicated arrays in 9.537e-07 s (0.02 %) + deduplicated arrays in 0.000e+00 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.512e-03 s (31.25 %) - memory allocations took 1.693e-05 s (0.35 %) - leafs setup took 2.861e-06 s (0.06 %) - halfword conversion took 1.334e-03 s (27.57 %) -Built (6 x 6)[0xaaaadf832ab0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + shuffled partitions in 1.277e-03 s (17.55 %) + memory allocations took 5.960e-06 s (0.08 %) + leafs setup took 1.907e-06 s (0.03 %) + halfword conversion took 1.362e-03 s (18.72 %) +Built (6 x 6)[0xaaaadcb67ab0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Base matrix: -(6 x 6)[0xaaaadf832ab0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(6 x 6)[0xaaaadcb67ab0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003127s; avg 0.001042s ( +/- 14.91/ 10.42 %); best 0.0008869s; worst 0.001151s; std dev. 0.0001127 (taking best). -Reference operation time is 0.000886917 s (0.6494 Mflops) with 12 threads. -After 0.003143s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.004192s; avg 0.001397s ( +/- 31.51/ 29.32 %); best 0.000957s; worst 0.001807s; std dev. 0.0003477 (taking best). +Reference operation time is 0.000957012 s (0.6019 Mflops) with 12 threads. +After 0.004219s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.002741s; avg 0.0009137s ( +/- 1.50/ 0.80 %); best 0.0009s; worst 0.000921s; std dev. 9.674e-06 (taking best). -Reference operation time is 0.00090003 s (0.64 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.0009 Mflops: 0.640) -Merge (22 -> 16 leaves) took w.c.t. of 0.0001152s, ~8.821e-06s of computing time (of which 9.537e-07s sorting, 4.053e-06s analysis) -3 iterations (12 th.) took 0.003131s; avg 0.001044s ( +/- 32.17/ 31.36 %); best 0.0007079s; worst 0.001371s; std dev. 0.0002708 (taking best). -Reference operation time is 0.000707865 s (0.8137 Mflops) with 12 threads. -After merge step 1: tpop: 0.0007079 s ~Mflops: 0.814 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.271x: 0.0009s -> 0.0007079s, so taking this instance. -Merge (16 -> 10 leaves) took w.c.t. of 0.0003581s, ~7.153e-06s of computing time (of which 9.537e-07s sorting, 4.053e-06s analysis) -3 iterations (12 th.) took 0.002161s; avg 0.0007203s ( +/- 13.78/ 27.43 %); best 0.0006211s; worst 0.0009179s; std dev. 0.0001397 (taking best). -Reference operation time is 0.00062108 s (0.9274 Mflops) with 12 threads. -After merge step 2: tpop: 0.0006211 s ~Mflops: 0.927 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SPEEDUP of 1.140x: 0.0007079s -> 0.0006211s, so taking this instance. -Merge (10 -> 7 leaves) took w.c.t. of 1.121e-05s, ~2.861e-06s of computing time (of which 0s sorting, 2.861e-06s analysis) -3 iterations (12 th.) took 0.002509s; avg 0.0008363s ( +/- 26.48/ 47.68 %); best 0.0006149s; worst 0.001235s; std dev. 0.0002825 (taking best). -Reference operation time is 0.000614882 s (0.9368 Mflops) with 12 threads. -After merge step 3: tpop: 0.0006149 s ~Mflops: 0.937 nsubm:7 otn:12 -Applying merge (10 -> 7 leaves, 12 th.) yielded SPEEDUP of 1.010x: 0.0006211s -> 0.0006149s, so taking this instance. -Merge (7 -> 4 leaves) took w.c.t. of 1.097e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (12 th.) took 0.00184s; avg 0.0006133s ( +/- 2.15/ 2.20 %); best 0.0006001s; worst 0.0006268s; std dev. 1.09e-05 (taking best). -Reference operation time is 0.0006001 s (0.9598 Mflops) with 12 threads. -After merge step 4: tpop: 0.0006001 s ~Mflops: 0.960 nsubm:4 otn:12 -Applying merge (7 -> 4 leaves, 12 th.) yielded SPEEDUP of 1.025x: 0.0006149s -> 0.0006001s, so taking this instance. -Merge (4 -> 1 leaves) took w.c.t. of 9.06e-06s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) -3 iterations (12 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 95.40/100.00 %); best 4.386e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 4.38571e-08 s (1.313e+04 Mflops) with 12 threads. -After merge step 5: tpop: 4.386e-08 s ~Mflops: 13133.564 nsubm:1 otn:12 -Applying merge (4 -> 1 leaves, 12 th.) yielded SPEEDUP of 13683.066x: 0.0006001s -> 4.386e-08s, so taking this instance. -Merged all the matrix leaves: no reason to continue merging. -A total of 5 merge steps (of max 6) (22 -> 1 subms) took 0.01994s (of which 0.0005174s partitioning, 0s I/O); computing times: 2.694e-05s in par. loops, 3.815e-06s sorting, 1.431e-05s analyzing) -Total merge + benchmarking process took 0.01994s, equivalent to 454547.4/22.1 new/old ops (0.01134s for 6 clones -- as 258499.6/12.6 ops, or 43083.3/2.1 ops per clone), SPEEDUP of 20521.881x -Applying multi-merge (22 -> 1 leaves, 5 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 20521.881x (0.0009s -> 4.386e-08s), will amortize in 22.2 ops by saving 0.0009s per op. -In 1 tuning rounds (tot. 0.025s, 0.011s for constructor, 6 clones) obtained a SPEEDUP of 2052088.1% (2.052e+04x) (from 0.64 to 1.313e+04 Mflops). -After 0.024557s, global autotuning declared speedup of 20521.9 x, when using threads count of 12 and a new matrix: -(6 x 6)[0xaaaadf832420]{C} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' +3 iterations (12 th.) took 0.002976s; avg 0.0009921s ( +/- 19.37/ 34.68 %); best 0.0007999s; worst 0.001336s; std dev. 0.0002438 (taking best). +Reference operation time is 0.000799894 s (0.7201 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.0007999 Mflops: 0.720) +Merge (22 -> 16 leaves) took w.c.t. of 0.0005708s, ~1.001e-05s of computing time (of which 3.099e-06s sorting, 2.861e-06s analysis) +3 iterations (12 th.) took 0.002733s; avg 0.000911s ( +/- 27.66/ 55.01 %); best 0.000659s; worst 0.001412s; std dev. 0.0003544 (taking best). +Reference operation time is 0.000658989 s (0.8741 Mflops) with 12 threads. +After merge step 1: tpop: 0.000659 s ~Mflops: 0.874 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.214x: 0.0007999s -> 0.000659s, so taking this instance. +Merge (16 -> 10 leaves) took w.c.t. of 8.392e-05s, ~1.216e-05s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) +3 iterations (12 th.) took 0.004376s; avg 0.001459s ( +/- 46.94/ 46.09 %); best 0.0007739s; worst 0.002131s; std dev. 0.0005541 (taking best). +Reference operation time is 0.000773907 s (0.7443 Mflops) with 12 threads. +After merge step 2: tpop: 0.0007739 s ~Mflops: 0.744 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.174x: 0.000659s -> 0.0007739s. +Merge (10 -> 7 leaves) took w.c.t. of 1.407e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 0.006903s; avg 0.002301s ( +/- 44.03/ 43.73 %); best 0.001288s; worst 0.003307s; std dev. 0.0008243 (taking best). +Reference operation time is 0.00128794 s (0.4472 Mflops) with 12 threads. +After merge step 3: tpop: 0.001288 s ~Mflops: 0.447 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.954x: 0.000659s -> 0.001288s. +Skipping further merge based tests after 2 definite performance degradations in a row (and last exceeding limit). +A total of 3 merge steps (of max 6) (22 -> 7 subms) took 0.01908s (of which 0.0006828s partitioning, 0s I/O); computing times: 2.623e-05s in par. loops, 5.96e-06s sorting, 1.001e-05s analyzing) +Total merge + benchmarking process took 0.01908s, equivalent to 28.9/23.8 new/old ops (0.006809s for 2 clones -- as 10.3/8.5 ops, or 5.2/4.3 ops per clone), SPEEDUP of 1.214x +Applying multi-merge (22 -> 16 leaves, 1 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.214x (0.0007999s -> 0.000659s), will amortize in 135.4 ops by saving 0.0001409s per op. +In 1 tuning rounds (tot. 0.025s, 0.0068s for constructor, 2 clones) obtained a SPEEDUP of 21.4% (1.214x) (from 0.7201 to 0.8741 Mflops). +After 0.024659s, global autotuning declared speedup of 1.21382 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaaadcb61aa0]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Considering Z clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 3.873e-03 s (100.00 %) - analyzed arrays in 1.233e-03 s (31.84 %) + converted COO to RSB in 5.448e-03 s (100.00 %) + analyzed arrays in 1.649e-03 s (30.27 %) cleaned-up arrays in 9.537e-07 s (0.02 %) - deduplicated arrays in 0.000e+00 s (0.00 %) + deduplicated arrays in 1.192e-06 s (0.02 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.468e-03 s (37.90 %) - memory allocations took 2.289e-05 s (0.59 %) - leafs setup took 3.099e-06 s (0.08 %) - halfword conversion took 1.144e-03 s (29.54 %) -Built (6 x 6)[0xaaaadf836130]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' + shuffled partitions in 2.455e-03 s (45.06 %) + memory allocations took 3.815e-06 s (0.07 %) + leafs setup took 3.099e-06 s (0.06 %) + halfword conversion took 1.334e-03 s (24.49 %) +Built (6 x 6)[0xaaaadcb67ab0]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' Base matrix: -(6 x 6)[0xaaaadf836130]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' +(6 x 6)[0xaaaadcb67ab0]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.003037s; avg 0.001012s ( +/- 36.88/ 33.16 %); best 0.000639s; worst 0.001348s; std dev. 0.0002907 (taking best). -Reference operation time is 0.000638962 s (0.9015 Mflops) with 12 threads. -After 0.003054s, autotuning routine did not find a better threads count configuration. +3 iterations (12 th.) took 0.01524s; avg 0.005081s ( +/- 57.19/ 28.99 %); best 0.002175s; worst 0.006554s; std dev. 0.002055 (taking best). +Reference operation time is 0.00217509 s (0.2648 Mflops) with 12 threads. +After 0.015271s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (12 th.) took 0.004415s; avg 0.001472s ( +/- 59.17/ 83.67 %); best 0.0006008s; worst 0.002703s; std dev. 0.0008953 (taking best). -Reference operation time is 0.000600815 s (0.9587 Mflops) with 12 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz (tpop: 0.0006008 Mflops: 0.959) -Merge (28 -> 22 leaves) took w.c.t. of 0.0003171s, ~1.097e-05s of computing time (of which 2.861e-06s sorting, 4.053e-06s analysis) -3 iterations (12 th.) took 0.002471s; avg 0.0008237s ( +/- 34.06/ 61.46 %); best 0.0005431s; worst 0.00133s; std dev. 0.0003587 (taking best). -Reference operation time is 0.000543118 s (1.061 Mflops) with 12 threads. -After merge step 1: tpop: 0.0005431 s ~Mflops: 1.061 nsubm:22 otn:12 -Applying merge (28 -> 22 leaves, 12 th.) yielded SPEEDUP of 1.106x: 0.0006008s -> 0.0005431s, so taking this instance. -Merge (22 -> 16 leaves) took w.c.t. of 9.203e-05s, ~6.914e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) -3 iterations (12 th.) took 0.002323s; avg 0.0007744s ( +/- 51.69/ 42.95 %); best 0.0003741s; worst 0.001107s; std dev. 0.000303 (taking best). -Reference operation time is 0.000374079 s (1.54 Mflops) with 12 threads. -After merge step 2: tpop: 0.0003741 s ~Mflops: 1.540 nsubm:16 otn:12 -Applying merge (22 -> 16 leaves, 12 th.) yielded SPEEDUP of 1.452x: 0.0005431s -> 0.0003741s, so taking this instance. -Merge (16 -> 10 leaves) took w.c.t. of 0.0003211s, ~1.001e-05s of computing time (of which 1.907e-06s sorting, 1.907e-06s analysis) -3 iterations (12 th.) took 0.00303s; avg 0.00101s ( +/- 46.94/ 45.64 %); best 0.000536s; worst 0.001471s; std dev. 0.0003819 (taking best). -Reference operation time is 0.000535965 s (1.075 Mflops) with 12 threads. -After merge step 3: tpop: 0.000536 s ~Mflops: 1.075 nsubm:10 otn:12 -Applying merge (16 -> 10 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.433x: 0.0003741s -> 0.000536s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 3 merge steps (of max 6) (28 -> 10 subms) took 0.01304s (of which 0.0007393s partitioning, 0s I/O); computing times: 2.789e-05s in par. loops, 5.722e-06s sorting, 1.097e-05s analyzing) -Total merge + benchmarking process took 0.01304s, equivalent to 34.9/21.7 new/old ops (0.006128s for 3 clones -- as 16.4/10.2 ops, or 5.5/3.4 ops per clone), SPEEDUP of 1.606x -Applying multi-merge (28 -> 16 leaves, 2 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 1.606x (0.0006008s -> 0.0003741s), will amortize in 57.5 ops by saving 0.0002267s per op. -In 1 tuning rounds (tot. 0.019s, 0.0061s for constructor, 3 clones) obtained a SPEEDUP of 60.6% (1.606x) (from 0.9587 to 1.54 Mflops). -After 0.019208s, global autotuning declared speedup of 1.60612 x, when using threads count of 12 and a new matrix: -(6 x 6)[0xaaaadf839880]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +3 iterations (12 th.) took 0.002424s; avg 0.000808s ( +/- 6.08/ 10.15 %); best 0.0007589s; worst 0.00089s; std dev. 5.837e-05 (taking best). +Reference operation time is 0.000758886 s (0.759 Mflops) with 12 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz (tpop: 0.0007589 Mflops: 0.759) +Merge (28 -> 22 leaves) took w.c.t. of 0.0005231s, ~1.097e-05s of computing time (of which 1.907e-06s sorting, 5.007e-06s analysis) +3 iterations (12 th.) took 0.005851s; avg 0.00195s ( +/- 68.25/ 35.31 %); best 0.0006192s; worst 0.002639s; std dev. 0.0009414 (taking best). +Reference operation time is 0.000619173 s (0.9303 Mflops) with 12 threads. +After merge step 1: tpop: 0.0006192 s ~Mflops: 0.930 nsubm:22 otn:12 +Applying merge (28 -> 22 leaves, 12 th.) yielded SPEEDUP of 1.226x: 0.0007589s -> 0.0006192s, so taking this instance. +Merge (22 -> 16 leaves) took w.c.t. of 0.0006361s, ~1.097e-05s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 0.0039s; avg 0.0013s ( +/- 49.78/ 30.33 %); best 0.0006528s; worst 0.001694s; std dev. 0.0004612 (taking best). +Reference operation time is 0.00065279 s (0.8824 Mflops) with 12 threads. +After merge step 2: tpop: 0.0006528 s ~Mflops: 0.882 nsubm:16 otn:12 +Applying merge (22 -> 16 leaves, 12 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.054x: 0.0006192s -> 0.0006528s. +Merge (16 -> 10 leaves) took w.c.t. of 0.000464s, ~1.168e-05s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (12 th.) took 0.003649s; avg 0.001216s ( +/- 41.47/ 55.71 %); best 0.0007119s; worst 0.001894s; std dev. 0.0004979 (taking best). +Reference operation time is 0.000711918 s (0.8091 Mflops) with 12 threads. +After merge step 3: tpop: 0.0007119 s ~Mflops: 0.809 nsubm:10 otn:12 +Applying merge (16 -> 10 leaves, 12 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.150x: 0.0006192s -> 0.0007119s. +Merge (10 -> 7 leaves) took w.c.t. of 1.192e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 3.815e-06s analysis) +3 iterations (12 th.) took 0.002541s; avg 0.0008469s ( +/- 24.44/ 23.86 %); best 0.0006399s; worst 0.001049s; std dev. 0.0001671 (taking best). +Reference operation time is 0.000639915 s (0.9001 Mflops) with 12 threads. +After merge step 4: tpop: 0.0006399 s ~Mflops: 0.900 nsubm:7 otn:12 +Applying merge (10 -> 7 leaves, 12 th.) yielded SLOWDOWN (3th of 3 tolerable) of 1.034x: 0.0006192s -> 0.0006399s. +Merge (7 -> 4 leaves) took w.c.t. of 5.007e-06s, ~9.537e-07s of computing time (of which 0s sorting, 2.146e-06s analysis) +3 iterations (12 th.) took 0.003892s; avg 0.001297s ( +/- 61.54/113.51 %); best 0.000499s; worst 0.00277s; std dev. 0.001043 (taking best). +Reference operation time is 0.00049901 s (1.154 Mflops) with 12 threads. +After merge step 5: tpop: 0.000499 s ~Mflops: 1.154 nsubm:4 otn:12 +Applying merge (7 -> 4 leaves, 12 th.) yielded SPEEDUP of 1.241x: 0.0006192s -> 0.000499s, so taking this instance. +Merge (4 -> 1 leaves) took w.c.t. of 2.909e-05s, ~1.788e-05s of computing time (of which 1.407e-05s sorting, 2.861e-06s analysis) +3 iterations (12 th.) took 5.007e-06s; avg 1.669e-06s ( +/- 97.93/142.86 %); best 3.455e-08s; worst 4.053e-06s; std dev. 1.73e-06 (taking best). +Reference operation time is 3.45469e-08 s (1.667e+04 Mflops) with 12 threads. +After merge step 6: tpop: 3.455e-08 s ~Mflops: 16673.010 nsubm:1 otn:12 +Applying merge (4 -> 1 leaves, 12 th.) yielded SPEEDUP of 14444.444x: 0.000499s -> 3.455e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 6 merge steps (of max 6) (28 -> 1 subms) took 0.03067s (of which 0.001684s partitioning, 0s I/O); computing times: 5.651e-05s in par. loops, 2.074e-05s sorting, 2.193e-05s analyzing) +Total merge + benchmarking process took 0.03067s, equivalent to 887722.6/40.4 new/old ops (0.0164s for 4 clones -- as 474830.9/21.6 ops, or 118707.7/5.4 ops per clone), SPEEDUP of 21966.874x +Applying multi-merge (28 -> 1 leaves, 6 steps, 0 -> 12 th.sp.) yielded SPEEDUP of 21966.874x (0.0007589s -> 3.455e-08s), will amortize in 40.4 ops by saving 0.0007589s per op. +In 1 tuning rounds (tot. 0.041s, 0.016s for constructor, 4 clones) obtained a SPEEDUP of 2196587.4% (2.197e+04x) (from 0.759 to 1.667e+04 Mflops). +After 0.040522s, global autotuning declared speedup of 21966.9 x, when using threads count of 12 and a new matrix: +(6 x 6)[0xaaaadcb62d40]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -9203,19 +9285,18 @@ 4 0 DIFF PRINT TEST END Beginning large binary search test. -Detected 63089266688 bytes of memory, comprehensive of 50521370624 of free memory. +Detected 63089258496 bytes of memory, comprehensive of 17585635328 of free memory. On this system, maximal array of coordinates can have 2147483137 elements and occupy 8589932548 bytes. -Will perform the test using less memory (3367 MB) than on the maximal coordinate indices array (3531289600) allows. -(c)allocated 882822400 nnz (3531289600 bytes) -Succeeded retrieving array last element. -Successfully performed large binary search test. +Will perform the test using less memory (17592186040610 MB) than on the maximal coordinate indices array (18446744069718908928) allows. +Skipping test: too little memory. +Skipping large binary search test. BASIC SPARSE BLAS TEST: BEGIN INIT INTERFACE TEST: BEGIN got RSB_IO_WANT_EXTRA_VERBOSE_INTERFACE: -1 got RSB_IO_WANT_IS_INITIALIZED_MARKER: 1 INIT INTERFACE TEST: END (SUCCESS) DEVEL PRINT TEST: BEGIN -(4 x 4)[0xaaaaeba583a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(4 x 4)[0xaaaae55193a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -9224,8 +9305,8 @@ RSB_FLAG_ASSEMBLED_IN_COO_ARRAYS | RSB_FLAG_OWN_PARTITIONING_ARRAYS | RSB_FLAG_SORT_INPUT -(2 x 2)[0xaaaaeba584b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0xaaaaeba585c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaaae55194b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaaae55195c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' #R 4 x 4, 4 nnz (16 bytes), 16 index space for bytes, 544 bytes for 2 structs (2 of which are on the diagonal) (1e+02% of nnz are on the diagonal) #N at 0 0, 4 x 4, 4 nnz ( 25%) #T at 0 0, 2 x 2, 2 nnz ( 50%) @@ -9233,9 +9314,9 @@ ( 0x2046186 = { rec:1 coo:1 css:1 hw:1 ic:1 fi:0 symflags: } ) DEVEL PRINT TEST: END PRINT TEST: BEGIN [QUIET] -(2 x 2)[0xaaaaeba584b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0xaaaaeba585c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(4 x 4)[0xaaaaeba583a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(2 x 2)[0xaaaae55194b0]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0xaaaae55195c0]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(4 x 4)[0xaaaae55193a0]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -9253,8 +9334,8 @@ BASIC PRIMITIVES TEST: BEGIN BASIC PRIMITIVES TEST: END (SUCCESS) ADVANCED SPARSE BLAS TEST: BEGIN [limit 30.000000s] [QUIET] -Terminating testing earlier due to user timeout request: test took 30.009580 s, max allowed was 30.000000. - PASSED:19597 +Terminating testing earlier due to user timeout request: test took 30.000919 s, max allowed was 30.000000. + PASSED:18025 FAILED:0 ADVANCED SPARSE BLAS TEST: END (SUCCESS) gmake qtests -C librsbpp @@ -9263,14 +9344,14 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' ./rsbtt -if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh +if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh ++ ./rsbpp Td,s G.mtx ++ grep Z-sort ++ wc -l + test 54 = 54 ++ grep Z-sort -++ wc -l ++ ./rsbpp Td G.mtx +++ wc -l + test 27 = 27 ++ ./rsbpp Td,z G.mtx ++ grep Z-sort @@ -9297,11 +9378,11 @@ ++ wc -l + test 0 = 0 ++ ./rsbpp vvvTd,z G.mtx -++ grep Range ++ wc -l +++ grep Range + test 258 -gt 0 -++ ./rsbpp vvvTd,z S.mtx ++ grep Range +++ ./rsbpp vvvTd,z S.mtx ++ wc -l + test 0 -eq 0 ++ ./rsbpp vvvTd,z G.mtx @@ -9320,13 +9401,13 @@ + test 9 = 9 ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r1sFvtN,T -++ wc -l ++ grep spmm- +++ wc -l + test 3 = 3 -++ OMP_NUM_THREADS=1 -++ ./rsbpp C1000m100M100I1r1vtN,TsF ++ grep spmm- ++ wc -l +++ OMP_NUM_THREADS=1 +++ ./rsbpp C1000m100M100I1r1vtN,TsF + test 2 = 2 ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r0vtN,TsF @@ -9402,7 +9483,7 @@ 0 0 0 0 before tuning for SPMV: -(3 x 3)[0xaaaab5dbb4c0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' +(3 x 3)[0xaaaae6f2cb50]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' ** x: 1.1 @@ -9491,18 +9572,18 @@ BEGIN Rsb_Matrix_test_multimatrix_ms_mnrhs BEGIN -(3 x 3)[0xaaaab5ddca00]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae6f49830]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaaab5ddca00]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaaab5deee90]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae6f49830]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae6f39590]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaaab5deee90]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaaab5ddca00]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae6f39590]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae6f49830]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1.00745: +(3 x 3)[0xaaaae6f682a0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae6f49830]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' Tuned with speedup factor of 1: -(3 x 3)[0xaaaab5ddca00]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0xaaaab5deee90]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1: -(3 x 3)[0xaaaab5deee90]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0xaaaae6f49830]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' END OK: terminating with no allocations registered in librsb [*] tests terminated successfully ! @@ -9519,10 +9600,10 @@ ./rsbtest --no-tune --max_t 0.01 --serial | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q Building ./rsbtest --no-tune --max_t 0.01 --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --no-trans --alpha 1 --type d --rand --serial . | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q adding ! ./rsbtest --mkl A.mkl -running on codethink03-arm64 +running on i-capture-the-hostname Built without the MKL. ( ! ./rsbtest --unrecognized-option-triggers-abort ) -running on codethink03-arm64 +running on i-capture-the-hostname /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest/.libs/rsbtest: unrecognized option '--unrecognized-option-triggers-abort' unrecognized option, aborting. ( ./rsbtest --no-tune --max_t 0.01 --skip-loading-hermitian-matrices --skip-loading-unsymmetric-matrices --tune-maxt 10 --tune-maxr 10 --verbose-tuning --extra-verbose-interface --min_t 0.01 --max_t 0.01 --mintimes 1 --maxtimes 1 --verbose --skip-loading-symmetric-matrices A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q skip ) @@ -9531,7 +9612,7 @@ ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --types all --nthreads 1,2 --maxtimes 1 -+ A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q 2.threads ) ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --render-only A.mtx > /dev/null ) ! ./rsbtest --no-tune --max_t 0.01 --quiet --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --render --no-trans --alpha 1 --type all A.mtx -running on codethink03-arm64 +running on i-capture-the-hostname Will not invoke autotuning routine. Benchmark will sample for at most 0.01 s Built without render support! @@ -9583,7 +9664,7 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' - /bin/bash ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' + /bin/sh ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu' libtool: install: /usr/bin/install -c .libs/librsb.so.0.0.0 /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu/librsb.so.0.0.0 libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu && { ln -s -f librsb.so.0.0.0 librsb.so.0 || { rm -f librsb.so.0 && ln -s librsb.so.0.0.0 librsb.so.0; }; }) libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu && { ln -s -f librsb.so.0.0.0 librsb.so || { rm -f librsb.so && ln -s librsb.so.0.0.0 librsb.so; }; }) @@ -9593,7 +9674,7 @@ libtool: install: ranlib /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/aarch64-linux-gnu/librsb.a libtool: warning: remember to run 'libtool --finish /usr/lib/aarch64-linux-gnu' /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' - /bin/bash ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' + /bin/sh ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' libtool: warning: 'librsb.la' has not been installed in '/usr/lib/aarch64-linux-gnu' libtool: install: /usr/bin/install -c .libs/rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin/rsbench /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' @@ -9728,8 +9809,8 @@ dh_gencontrol dh_md5sums dh_builddeb -dpkg-deb: building package 'librsb0t64' in '../librsb0t64_1.3.0.2+dfsg-7_arm64.deb'. dpkg-deb: building package 'librsb0t64-dbgsym' in '../librsb0t64-dbgsym_1.3.0.2+dfsg-7_arm64.deb'. +dpkg-deb: building package 'librsb0t64' in '../librsb0t64_1.3.0.2+dfsg-7_arm64.deb'. dpkg-deb: building package 'librsb-dev' in '../librsb-dev_1.3.0.2+dfsg-7_arm64.deb'. dpkg-deb: building package 'librsb-tools' in '../librsb-tools_1.3.0.2+dfsg-7_arm64.deb'. dpkg-deb: building package 'librsb-tools-dbgsym' in '../librsb-tools-dbgsym_1.3.0.2+dfsg-7_arm64.deb'. @@ -9742,12 +9823,14 @@ dpkg-buildpackage: info: binary-only upload (no source included) dpkg-genchanges: info: not including original source code in upload I: copying local configuration +I: user script /srv/workspace/pbuilder/1182468/tmp/hooks/B01_cleanup starting +I: user script /srv/workspace/pbuilder/1182468/tmp/hooks/B01_cleanup finished I: unmounting dev/ptmx filesystem I: unmounting dev/pts filesystem I: unmounting dev/shm filesystem I: unmounting proc filesystem I: unmounting sys filesystem I: cleaning the build env -I: removing directory /srv/workspace/pbuilder/2200206 and its subdirectories -I: Current time: Thu Mar 12 03:05:31 -12 2026 -I: pbuilder-time-stamp: 1773327931 +I: removing directory /srv/workspace/pbuilder/1182468 and its subdirectories +I: Current time: Fri Feb 7 22:56:31 +14 2025 +I: pbuilder-time-stamp: 1738918591