Diff of the two buildlogs: -- --- b1/build.log 2024-11-22 13:49:03.496188754 +0000 +++ b2/build.log 2024-11-22 14:23:00.259949831 +0000 @@ -1,6 +1,6 @@ I: pbuilder: network access will be disabled during build -I: Current time: Thu Dec 25 07:48:28 -12 2025 -I: pbuilder-time-stamp: 1766692108 +I: Current time: Sat Nov 23 03:49:05 +14 2024 +I: pbuilder-time-stamp: 1732283345 I: Building the build Environment I: extracting base tarball [/var/cache/pbuilder/unstable-reproducible-base.tgz] I: copying local configuration @@ -29,54 +29,86 @@ dpkg-source: info: applying fix_mod_install.patch I: using fakeroot in build. I: Installing the build-deps -I: user script /srv/workspace/pbuilder/87525/tmp/hooks/D02_print_environment starting +I: user script /srv/workspace/pbuilder/6634/tmp/hooks/D01_modify_environment starting +debug: Running on ionos2-i386. +I: Changing host+domainname to test build reproducibility +I: Adding a custom variable just for the fun of it... +I: Changing /bin/sh to bash +'/bin/sh' -> '/bin/bash' +lrwxrwxrwx 1 root root 9 Nov 22 13:49 /bin/sh -> /bin/bash +I: Setting pbuilder2's login shell to /bin/bash +I: Setting pbuilder2's GECOS to second user,second room,second work-phone,second home-phone,second other +I: user script /srv/workspace/pbuilder/6634/tmp/hooks/D01_modify_environment finished +I: user script /srv/workspace/pbuilder/6634/tmp/hooks/D02_print_environment starting I: set - BUILDDIR='/build/reproducible-path' - BUILDUSERGECOS='first user,first room,first work-phone,first home-phone,first other' - BUILDUSERNAME='pbuilder1' - BUILD_ARCH='i386' - DEBIAN_FRONTEND='noninteractive' - DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=22 ' - DISTRIBUTION='unstable' - HOME='/root' - HOST_ARCH='i386' + BASH=/bin/sh + BASHOPTS=checkwinsize:cmdhist:complete_fullquote:extquote:force_fignore:globasciiranges:globskipdots:hostcomplete:interactive_comments:patsub_replacement:progcomp:promptvars:sourcepath + BASH_ALIASES=() + BASH_ARGC=() + BASH_ARGV=() + BASH_CMDS=() + BASH_LINENO=([0]="12" [1]="0") + BASH_LOADABLES_PATH=/usr/local/lib/bash:/usr/lib/bash:/opt/local/lib/bash:/usr/pkg/lib/bash:/opt/pkg/lib/bash:. + BASH_SOURCE=([0]="/tmp/hooks/D02_print_environment" [1]="/tmp/hooks/D02_print_environment") + BASH_VERSINFO=([0]="5" [1]="2" [2]="32" [3]="1" [4]="release" [5]="i686-pc-linux-gnu") + BASH_VERSION='5.2.32(1)-release' + BUILDDIR=/build/reproducible-path + BUILDUSERGECOS='second user,second room,second work-phone,second home-phone,second other' + BUILDUSERNAME=pbuilder2 + BUILD_ARCH=i386 + DEBIAN_FRONTEND=noninteractive + DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=10 ' + DIRSTACK=() + DISTRIBUTION=unstable + EUID=0 + FUNCNAME=([0]="Echo" [1]="main") + GROUPS=() + HOME=/root + HOSTNAME=i-capture-the-hostname + HOSTTYPE=i686 + HOST_ARCH=i386 IFS=' ' - INVOCATION_ID='0f298b4b9c6649ecb8a8d62081f2e41c' - LANG='C' - LANGUAGE='en_US:en' - LC_ALL='C' - LD_LIBRARY_PATH='/usr/lib/libeatmydata' - LD_PRELOAD='libeatmydata.so' - MAIL='/var/mail/root' - OPTIND='1' - PATH='/usr/sbin:/usr/bin:/sbin:/bin:/usr/games' - PBCURRENTCOMMANDLINEOPERATION='build' - PBUILDER_OPERATION='build' - PBUILDER_PKGDATADIR='/usr/share/pbuilder' - PBUILDER_PKGLIBDIR='/usr/lib/pbuilder' - PBUILDER_SYSCONFDIR='/etc' - PPID='87525' - PS1='# ' - PS2='> ' + INVOCATION_ID=884027f429ce43969fbaee49600559b7 + LANG=C + LANGUAGE=de_CH:de + LC_ALL=C + LD_LIBRARY_PATH=/usr/lib/libeatmydata + LD_PRELOAD=libeatmydata.so + MACHTYPE=i686-pc-linux-gnu + MAIL=/var/mail/root + OPTERR=1 + OPTIND=1 + OSTYPE=linux-gnu + PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path + PBCURRENTCOMMANDLINEOPERATION=build + PBUILDER_OPERATION=build + PBUILDER_PKGDATADIR=/usr/share/pbuilder + PBUILDER_PKGLIBDIR=/usr/lib/pbuilder + PBUILDER_SYSCONFDIR=/etc + PIPESTATUS=([0]="0") + POSIXLY_CORRECT=y + PPID=6634 PS4='+ ' - PWD='/' - SHELL='/bin/bash' - SHLVL='2' - SUDO_COMMAND='/usr/bin/timeout -k 18.1h 18h /usr/bin/ionice -c 3 /usr/bin/nice /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.igKwWWMX/pbuilderrc_hGTM --distribution unstable --hookdir /etc/pbuilder/first-build-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/unstable-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.igKwWWMX/b1 --logfile b1/build.log dbcsr_2.6.0-2.dsc' - SUDO_GID='112' - SUDO_UID='107' - SUDO_USER='jenkins' - TERM='unknown' - TZ='/usr/share/zoneinfo/Etc/GMT+12' - USER='root' - _='/usr/bin/systemd-run' - http_proxy='http://213.165.73.152:3128' + PWD=/ + SHELL=/bin/bash + SHELLOPTS=braceexpand:errexit:hashall:interactive-comments:posix + SHLVL=3 + SUDO_COMMAND='/usr/bin/timeout -k 24.1h 24h /usr/bin/ionice -c 3 /usr/bin/nice -n 11 /usr/bin/unshare --uts -- /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.igKwWWMX/pbuilderrc_2Vwc --distribution unstable --hookdir /etc/pbuilder/rebuild-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/unstable-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.igKwWWMX/b2 --logfile b2/build.log dbcsr_2.6.0-2.dsc' + SUDO_GID=112 + SUDO_UID=107 + SUDO_USER=jenkins + TERM=unknown + TZ=/usr/share/zoneinfo/Etc/GMT-14 + UID=0 + USER=root + _='I: set' + http_proxy=http://46.16.76.132:3128 I: uname -a - Linux ionos6-i386 6.1.0-27-amd64 #1 SMP PREEMPT_DYNAMIC Debian 6.1.115-1 (2024-11-01) x86_64 GNU/Linux + Linux i-capture-the-hostname 6.1.0-27-amd64 #1 SMP PREEMPT_DYNAMIC Debian 6.1.115-1 (2024-11-01) x86_64 GNU/Linux I: ls -l /bin - lrwxrwxrwx 1 root root 7 Aug 4 2024 /bin -> usr/bin -I: user script /srv/workspace/pbuilder/87525/tmp/hooks/D02_print_environment finished + lrwxrwxrwx 1 root root 7 Aug 4 21:30 /bin -> usr/bin +I: user script /srv/workspace/pbuilder/6634/tmp/hooks/D02_print_environment finished -> Attempting to satisfy build-dependencies -> Creating pbuilder-satisfydepends-dummy package Package: pbuilder-satisfydepends-dummy @@ -227,7 +259,7 @@ Get: 95 http://deb.debian.org/debian unstable/main i386 moreutils i386 0.69-1 [62.9 kB] Get: 96 http://deb.debian.org/debian unstable/main i386 mpi-default-bin i386 1.17 [2372 B] Get: 97 http://deb.debian.org/debian unstable/main i386 mpi-default-dev i386 1.17 [3144 B] -Fetched 73.4 MB in 1s (88.2 MB/s) +Fetched 73.4 MB in 1s (67.8 MB/s) debconf: delaying package configuration, since apt-utils is not installed Selecting previously unselected package libpython3.12-minimal:i386. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 19952 files and directories currently installed.) @@ -558,8 +590,8 @@ Setting up tzdata (2024b-3) ... Current default time zone: 'Etc/UTC' -Local time is now: Thu Dec 25 19:48:54 UTC 2025. -Universal Time is now: Thu Dec 25 19:48:54 UTC 2025. +Local time is now: Fri Nov 22 13:49:38 UTC 2024. +Universal Time is now: Fri Nov 22 13:49:38 UTC 2024. Run 'dpkg-reconfigure tzdata' if you wish to change it. Setting up autotools-dev (20220109.1) ... @@ -658,7 +690,11 @@ fakeroot is already the newest version (1.36-1). 0 upgraded, 0 newly installed, 0 to remove and 0 not upgraded. I: Building the package -I: Running cd /build/reproducible-path/dbcsr-2.6.0/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-genchanges -S > ../dbcsr_2.6.0-2_source.changes +I: user script /srv/workspace/pbuilder/6634/tmp/hooks/A99_set_merged_usr starting +Not re-configuring usrmerge for unstable +I: user script /srv/workspace/pbuilder/6634/tmp/hooks/A99_set_merged_usr finished +hostname: Name or service not known +I: Running cd /build/reproducible-path/dbcsr-2.6.0/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-genchanges -S > ../dbcsr_2.6.0-2_source.changes dpkg-buildpackage: info: source package dbcsr dpkg-buildpackage: info: source version 2.6.0-2 dpkg-buildpackage: info: source distribution unstable @@ -724,9 +760,9 @@ -- Performing Test f95-reshape-order-allocatable -- Performing Test f95-reshape-order-allocatable - Success -- FYPP preprocessor found. -Tests will run with 12 MPI ranks and 2 OpenMP threads each --- Configuring done (6.3s) --- Generating done (0.1s) +Tests will run with 7 MPI ranks and 2 OpenMP threads each +-- Configuring done (10.3s) +-- Generating done (0.2s) CMake Warning: Manually-specified variables were not used by the project: @@ -737,7 +773,7 @@ -- Build files have been written to: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu dh_auto_build -O--buildsystem=cmake - cd obj-i686-linux-gnu && make -j22 VERBOSE=1 + cd obj-i686-linux-gnu && make -j10 VERBOSE=1 make[1]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' /usr/bin/cmake -S/build/reproducible-path/dbcsr-2.6.0 -B/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu --check-build-system CMakeFiles/Makefile.cmake 0 /usr/bin/cmake -E cmake_progress_start /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/CMakeFiles /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu//CMakeFiles/progress.marks @@ -746,76 +782,76 @@ make -f src/CMakeFiles/dbcsr.dir/build.make src/CMakeFiles/dbcsr.dir/depend make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' [ 0%] Generating acc/dbcsr_acc_devmem.F -[ 1%] Generating work/dbcsr_work_operations.F [ 1%] Generating acc/cuda/dbcsr_cuda_profiling.F -[ 1%] Generating acc/dbcsr_acc_device.F +[ 1%] Generating work/dbcsr_work_operations.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/dbcsr_acc_devmem.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_devmem.F -[ 1%] Generating acc/dbcsr_acc_init.F +[ 1%] Generating acc/dbcsr_acc_device.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/work/dbcsr_work_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/work/dbcsr_work_operations.F -[ 2%] Generating acc/dbcsr_acc_stream.F -[ 2%] Generating acc/dbcsr_acc_event.F -[ 2%] Generating base/dbcsr_base_hooks.F -[ 2%] Generating acc/dbcsr_acc_hostmem.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/cuda/dbcsr_cuda_profiling.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/cuda/dbcsr_cuda_profiling.F -[ 2%] Generating acc/hip/dbcsr_hip_profiling.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/dbcsr_acc_device.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_device.F +[ 1%] Generating acc/hip/dbcsr_hip_profiling.F +[ 4%] Generating acc/dbcsr_acc_event.F +[ 4%] Generating acc/dbcsr_acc_hostmem.F [ 4%] Generating acc/dbcsr_acc_timings.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/dbcsr_acc_init.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_init.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/base/dbcsr_base_hooks.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_base_hooks.F -[ 4%] Generating base/dbcsr_machine.F -[ 5%] Generating base/dbcsr_kinds.F +[ 4%] Generating acc/dbcsr_acc_init.F +[ 4%] Generating acc/dbcsr_acc_stream.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/hip/dbcsr_hip_profiling.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/hip/dbcsr_hip_profiling.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/dbcsr_acc_event.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_event.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/dbcsr_acc_hostmem.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_hostmem.F -[ 5%] Generating block/dbcsr_block_access.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/dbcsr_acc_init.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_init.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/dbcsr_acc_stream.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_stream.F -[ 5%] Generating base/dbcsr_machine_internal.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/dbcsr_acc_timings.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_timings.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/acc/hip/dbcsr_hip_profiling.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/hip/dbcsr_hip_profiling.F +[ 4%] Generating base/dbcsr_base_hooks.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/base/dbcsr_base_hooks.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_base_hooks.F +[ 5%] Generating base/dbcsr_kinds.F +[ 5%] Generating base/dbcsr_machine.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/base/dbcsr_kinds.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_kinds.F -[ 5%] Generating block/dbcsr_index_operations.F -[ 5%] Generating block/dbcsr_iterator_operations.F -[ 7%] Generating block/dbcsr_block_operations.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/base/dbcsr_machine.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_machine.F +[ 5%] Generating base/dbcsr_machine_internal.F +[ 5%] Generating block/dbcsr_index_operations.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/base/dbcsr_machine_internal.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_machine_internal.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/block/dbcsr_block_access.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_block_access.F -[ 7%] Generating core/dbcsr_config.F -[ 8%] Generating core/dbcsr_array_types.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/block/dbcsr_index_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_index_operations.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/block/dbcsr_iterator_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_iterator_operations.F +[ 7%] Generating block/dbcsr_block_operations.F +[ 7%] Generating block/dbcsr_block_access.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/block/dbcsr_block_access.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_block_access.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/block/dbcsr_block_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_block_operations.F -[ 8%] Generating core/dbcsr_error_handling.F +[ 7%] Generating block/dbcsr_iterator_operations.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/block/dbcsr_iterator_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_iterator_operations.F +[ 8%] Generating core/dbcsr_array_types.F +[ 8%] Generating core/dbcsr_config.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_array_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_array_types.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_config.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_config.F [ 8%] Generating core/dbcsr_dict.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_array_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_array_types.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_dict.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_dict.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_error_handling.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_error_handling.F +[ 8%] Generating core/dbcsr_error_handling.F [ 10%] Generating core/dbcsr_iter_types.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_error_handling.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_error_handling.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_iter_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_iter_types.F [ 10%] Generating core/dbcsr_lib.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_lib.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_lib.F -[ 10%] Generating core/dbcsr_list_routinereport.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_list_routinereport.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_routinereport.F [ 10%] Generating core/dbcsr_list.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_list.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list.F [ 10%] Generating core/dbcsr_list_callstackentry.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_list_callstackentry.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_callstackentry.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_list.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list.F -[ 11%] Generating core/dbcsr_list_timerenv.F +[ 10%] Generating core/dbcsr_list_routinereport.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_list_routinereport.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_routinereport.F [ 11%] Generating core/dbcsr_list_routinestat.F -[ 11%] Generating core/dbcsr_log_handling.F -[ 11%] Generating core/dbcsr_methods.F -[ 11%] Generating core/dbcsr_timings.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_list_routinestat.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_routinestat.F -[ 13%] Generating core/dbcsr_print_messages.F +[ 11%] Generating core/dbcsr_list_timerenv.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_list_timerenv.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_timerenv.F +[ 11%] Generating core/dbcsr_log_handling.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_log_handling.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_log_handling.F -[ 13%] Generating core/dbcsr_timings_base_type.F +[ 11%] Generating core/dbcsr_methods.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_methods.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_methods.F +[ 13%] Generating core/dbcsr_print_messages.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_print_messages.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_print_messages.F +[ 13%] Generating core/dbcsr_timings.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_timings.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings.F +[ 13%] Generating core/dbcsr_timings_base_type.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_timings_base_type.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings_base_type.F [ 14%] Generating core/dbcsr_timings_report.F -[ 14%] Generating core/dbcsr_timings_types.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_timings_report.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings_report.F +[ 14%] Generating core/dbcsr_timings_types.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_timings_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings_types.F [ 15%] Generating core/dbcsr_types.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/core/dbcsr_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_types.F @@ -825,53 +861,53 @@ cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/data/dbcsr_data_methods_low.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_data_methods_low.F [ 17%] Generating data/dbcsr_data_operations.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/data/dbcsr_data_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_data_operations.F -[ 17%] Generating data/dbcsr_mem_methods.F [ 17%] Generating data/dbcsr_data_types.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/data/dbcsr_data_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_data_types.F +[ 17%] Generating data/dbcsr_mem_methods.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/data/dbcsr_mem_methods.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_mem_methods.F [ 18%] Generating data/dbcsr_ptr_util.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/data/dbcsr_ptr_util.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_ptr_util.F [ 18%] Generating dbcsr_api.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/data/dbcsr_ptr_util.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_ptr_util.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/dbcsr_api.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dbcsr_api.F [ 18%] Generating dist/dbcsr_dist_methods.F -[ 18%] Generating dist/dbcsr_dist_operations.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/dist/dbcsr_dist_methods.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dist/dbcsr_dist_methods.F +[ 18%] Generating dist/dbcsr_dist_operations.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/dist/dbcsr_dist_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dist/dbcsr_dist_operations.F +[ 18%] Generating dist/dbcsr_dist_util.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/dist/dbcsr_dist_util.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dist/dbcsr_dist_util.F [ 20%] Generating mm/dbcsr_acc_operations.F -[ 20%] Generating dist/dbcsr_dist_util.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_acc_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_acc_operations.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/dist/dbcsr_dist_util.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dist/dbcsr_dist_util.F -[ 20%] Generating mm/dbcsr_mm_csr.F [ 21%] Generating mm/dbcsr_mm.F -[ 21%] Generating mm/dbcsr_mm_3d.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_csr.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_csr.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm.F -[ 23%] Generating mm/dbcsr_mm_cannon.F -[ 23%] Generating mm/dbcsr_mm_accdrv.F +[ 21%] Generating mm/dbcsr_mm_accdrv.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_accdrv.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_accdrv.F +[ 21%] Generating mm/dbcsr_mm_3d.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_3d.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_3d.F -[ 23%] Generating mm/dbcsr_mm_common.F -[ 23%] Generating mm/dbcsr_mm_dist_operations.F -[ 24%] Generating mm/dbcsr_mm_sched.F -[ 24%] Generating mm/dbcsr_mm_hostdrv.F +[ 23%] Generating mm/dbcsr_mm_cannon.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_cannon.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_cannon.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_accdrv.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_accdrv.F +[ 23%] Generating mm/dbcsr_mm_common.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_common.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_common.F +[ 23%] Generating mm/dbcsr_mm_csr.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_csr.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_csr.F +[ 23%] Generating mm/dbcsr_mm_dist_operations.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_dist_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_dist_operations.F -[ 24%] Generating mm/dbcsr_mm_multrec.F +[ 23%] Generating mm/dbcsr_mm_hostdrv.F +[ 23%] Generating mm/dbcsr_mm_multrec.F +[ 24%] Generating mm/dbcsr_mm_sched.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_hostdrv.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_hostdrv.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_sched.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_sched.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_multrec.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_multrec.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_sched.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_sched.F [ 24%] Generating mm/dbcsr_mm_types.F -[ 24%] Generating mm/dbcsr_multiply_api.F -[ 24%] Generating mpi/dbcsr_mp_methods.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_mm_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_types.F +[ 24%] Generating mm/dbcsr_multiply_api.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mm/dbcsr_multiply_api.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_multiply_api.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mpi/dbcsr_mp_methods.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mpi/dbcsr_mp_methods.F +[ 24%] Generating mpi/dbcsr_mp_methods.F [ 26%] Generating mpi/dbcsr_mp_operations.F -[ 26%] Generating mpi/dbcsr_mpiwrap.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mpi/dbcsr_mp_methods.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mpi/dbcsr_mp_methods.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mpi/dbcsr_mp_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mpi/dbcsr_mp_operations.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mpi/dbcsr_mpiwrap.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mpi/dbcsr_mpiwrap.F +[ 26%] Generating mpi/dbcsr_mpiwrap.F [ 26%] Generating ops/dbcsr_csr_conversions.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/mpi/dbcsr_mpiwrap.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mpi/dbcsr_mpiwrap.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/ops/dbcsr_csr_conversions.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_csr_conversions.F [ 27%] Generating ops/dbcsr_io.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/ops/dbcsr_io.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_io.F @@ -880,39 +916,39 @@ [ 27%] Generating ops/dbcsr_test_methods.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/ops/dbcsr_test_methods.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_test_methods.F [ 28%] Generating ops/dbcsr_tests.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/ops/dbcsr_tests.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_tests.F +[ 28%] Generating tas/dbcsr_tas_base.F [ 28%] Generating ops/dbcsr_transformations.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/ops/dbcsr_tests.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_tests.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_base.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_base.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/ops/dbcsr_transformations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_transformations.F [ 28%] Generating tas/dbcsr_tas_global.F -[ 28%] Generating tas/dbcsr_tas_base.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_global.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_global.F [ 30%] Generating tas/dbcsr_tas_io.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_base.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_base.F -[ 30%] Generating tas/dbcsr_tas_mm.F -[ 30%] Generating tas/dbcsr_tas_reshape_ops.F -[ 31%] Generating tas/dbcsr_tas_split.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_io.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_io.F +[ 30%] Generating tas/dbcsr_tas_mm.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_mm.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_mm.F +[ 30%] Generating tas/dbcsr_tas_reshape_ops.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_reshape_ops.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_reshape_ops.F +[ 31%] Generating tas/dbcsr_tas_split.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_split.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_split.F -[ 31%] Generating tas/dbcsr_tas_types.F [ 31%] Generating tas/dbcsr_tas_test.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_types.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_test.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_test.F -[ 33%] Generating tas/dbcsr_tas_util.F -[ 33%] Generating tensors/dbcsr_allocate_wrap.F -[ 33%] Generating tensors/dbcsr_array_list_methods.F +[ 31%] Generating tas/dbcsr_tas_types.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_types.F +[ 31%] Generating tas/dbcsr_tas_util.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tas/dbcsr_tas_util.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_util.F +[ 33%] Generating tensors/dbcsr_allocate_wrap.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_allocate_wrap.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_allocate_wrap.F +[ 33%] Generating tensors/dbcsr_array_list_methods.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_array_list_methods.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_array_list_methods.F [ 33%] Generating tensors/dbcsr_tensor.F -[ 33%] Generating tensors/dbcsr_tensor_api.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor.F -[ 33%] Generating tensors/dbcsr_tensor_index.F +[ 33%] Generating tensors/dbcsr_tensor_api.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor_api.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_api.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor_index.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_index.F [ 34%] Generating tensors/dbcsr_tensor_block.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor_block.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_block.F +[ 34%] Generating tensors/dbcsr_tensor_index.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor_index.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_index.F [ 34%] Generating tensors/dbcsr_tensor_io.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor_io.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_io.F [ 36%] Generating tensors/dbcsr_tensor_reshape.F @@ -925,14 +961,14 @@ cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor_types.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_types.F [ 37%] Generating utils/dbcsr_array_sort.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/utils/dbcsr_array_sort.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_array_sort.F -[ 37%] Generating utils/dbcsr_btree.F [ 37%] Generating utils/dbcsr_blas_operations.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/utils/dbcsr_btree.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_btree.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/utils/dbcsr_blas_operations.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_blas_operations.F -[ 37%] Generating utils/dbcsr_min_heap.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/utils/dbcsr_min_heap.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_min_heap.F +[ 37%] Generating utils/dbcsr_btree.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/utils/dbcsr_btree.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_btree.F [ 39%] Generating utils/dbcsr_files.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/utils/dbcsr_files.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_files.F +[ 39%] Generating utils/dbcsr_min_heap.F +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/utils/dbcsr_min_heap.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_min_heap.F [ 39%] Generating utils/dbcsr_string_utilities.F cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/utils/dbcsr_string_utilities.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_string_utilities.F [ 40%] Generating utils/dbcsr_toollib.F @@ -944,27 +980,27 @@ make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make -f src/CMakeFiles/dbcsr.dir/build.make src/CMakeFiles/dbcsr.dir/build make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 40%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/hip/dbcsr_hip_profiling.F.o [ 40%] Building Fortran object src/CMakeFiles/dbcsr.dir/base/dbcsr_kinds.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_kinds.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_kinds.F -o CMakeFiles/dbcsr.dir/base/dbcsr_kinds.F.o [ 40%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_btree.F.o +[ 40%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/hip/dbcsr_hip_profiling.F.o [ 42%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_types.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_hip_profiling.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/hip/dbcsr_hip_profiling.F -o CMakeFiles/dbcsr.dir/acc/hip/dbcsr_hip_profiling.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_kinds.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_kinds.F -o CMakeFiles/dbcsr.dir/base/dbcsr_kinds.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_btree.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_btree.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_btree.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_types.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_types.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_hip_profiling.mod src/CMakeFiles/dbcsr.dir/dbcsr_hip_profiling.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/hip/dbcsr_hip_profiling.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_types.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_kinds.mod src/CMakeFiles/dbcsr.dir/dbcsr_kinds.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/hip/dbcsr_hip_profiling.F.o.provides.build /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_types.F.o.provides.build /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/base/dbcsr_kinds.F.o.provides.build -[ 42%] Building Fortran object src/CMakeFiles/dbcsr.dir/base/dbcsr_machine_internal.F.o -[ 42%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_string_utilities.F.o [ 43%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_array_sort.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_machine_internal.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_machine_internal.F -o CMakeFiles/dbcsr.dir/base/dbcsr_machine_internal.F.o -[ 44%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_timings_base_type.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_string_utilities.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_string_utilities.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_string_utilities.F.o +[ 43%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_string_utilities.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_array_sort.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_array_sort.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_array_sort.F.o +[ 43%] Building Fortran object src/CMakeFiles/dbcsr.dir/base/dbcsr_machine_internal.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_string_utilities.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_string_utilities.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_string_utilities.F.o +[ 44%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_timings_base_type.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_machine_internal.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/base/dbcsr_machine_internal.F -o CMakeFiles/dbcsr.dir/base/dbcsr_machine_internal.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_timings_base_type.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings_base_type.F -o CMakeFiles/dbcsr.dir/core/dbcsr_timings_base_type.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_timings_base_type.mod src/CMakeFiles/dbcsr.dir/dbcsr_timings_base_type.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_string_utilities.mod src/CMakeFiles/dbcsr.dir/dbcsr_string_utilities.mod.stamp GNU @@ -983,68 +1019,68 @@ /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_base_hooks.mod src/CMakeFiles/dbcsr.dir/dbcsr_base_hooks.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/base/dbcsr_base_hooks.F.o.provides.build [ 46%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/cuda/dbcsr_cuda_profiling.F.o -[ 46%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_min_heap.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_cuda_profiling.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/cuda/dbcsr_cuda_profiling.F -o CMakeFiles/dbcsr.dir/acc/cuda/dbcsr_cuda_profiling.F.o -[ 47%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_dict.F.o -[ 47%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_timings.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_min_heap.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_min_heap.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_min_heap.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_dict.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_dict.F -o CMakeFiles/dbcsr.dir/core/dbcsr_dict.F.o -[ 47%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_array_types.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_timings.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_timings.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_timings.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_array_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_array_types.F -o CMakeFiles/dbcsr.dir/core/dbcsr_array_types.F.o -[ 47%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_list_routinereport.F.o -[ 49%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_list_callstackentry.F.o +[ 47%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_device.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_device.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_device.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_device.F.o [ 47%] Building Fortran object src/CMakeFiles/dbcsr.dir/mpi/dbcsr_mpiwrap.F.o -[ 50%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_device.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_list_routinereport.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_routinereport.F -o CMakeFiles/dbcsr.dir/core/dbcsr_list_routinereport.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_list_callstackentry.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_callstackentry.F -o CMakeFiles/dbcsr.dir/core/dbcsr_list_callstackentry.F.o +[ 49%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_timings.F.o +[ 49%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_array_types.F.o +[ 49%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_toollib.F.o +[ 49%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_dict.F.o +[ 49%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_min_heap.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mpiwrap.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -Wno-error -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mpi/dbcsr_mpiwrap.F -o CMakeFiles/dbcsr.dir/mpi/dbcsr_mpiwrap.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_device.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_device.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_device.F.o -[ 50%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_toollib.F.o -[ 52%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_files.F.o -[ 52%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_iter_types.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_timings.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_timings.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_timings.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_array_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_array_types.F -o CMakeFiles/dbcsr.dir/core/dbcsr_array_types.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_min_heap.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_min_heap.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_min_heap.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_toollib.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_toollib.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_toollib.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_iter_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_iter_types.F -o CMakeFiles/dbcsr.dir/core/dbcsr_iter_types.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_dict.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_dict.F -o CMakeFiles/dbcsr.dir/core/dbcsr_dict.F.o +[ 50%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_files.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_files.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_files.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_files.F.o +[ 50%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_iter_types.F.o +[ 52%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_list_callstackentry.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_iter_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_iter_types.F -o CMakeFiles/dbcsr.dir/core/dbcsr_iter_types.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_list_callstackentry.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_callstackentry.F -o CMakeFiles/dbcsr.dir/core/dbcsr_list_callstackentry.F.o +[ 52%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_list_routinereport.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_list_routinereport.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_routinereport.F -o CMakeFiles/dbcsr.dir/core/dbcsr_list_routinereport.F.o [ 53%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_list_routinestat.F.o -[ 55%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_allocate_wrap.F.o +[ 53%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_print_messages.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_list_routinestat.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_routinestat.F -o CMakeFiles/dbcsr.dir/core/dbcsr_list_routinestat.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_allocate_wrap.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_allocate_wrap.F -o CMakeFiles/dbcsr.dir/tensors/dbcsr_allocate_wrap.F.o -[ 55%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_print_messages.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_print_messages.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_print_messages.F -o CMakeFiles/dbcsr.dir/core/dbcsr_print_messages.F.o +[ 55%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_allocate_wrap.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_allocate_wrap.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_allocate_wrap.F -o CMakeFiles/dbcsr.dir/tensors/dbcsr_allocate_wrap.F.o +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_cuda_profiling.mod src/CMakeFiles/dbcsr.dir/dbcsr_cuda_profiling.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_device.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_device.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_timings.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_timings.mod.stamp GNU -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_cuda_profiling.mod src/CMakeFiles/dbcsr.dir/dbcsr_cuda_profiling.mod.stamp GNU -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_iter_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_iter_types.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_device.F.o.provides.build -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_toollib.mod src/CMakeFiles/dbcsr.dir/dbcsr_toollib.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_timings.F.o.provides.build -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/cuda/dbcsr_cuda_profiling.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_array_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_array_types.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_iter_types.F.o.provides.build -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/utils/dbcsr_toollib.F.o.provides.build +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_btree.mod src/CMakeFiles/dbcsr.dir/dbcsr_btree.mod.stamp GNU +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_min_heap.mod src/CMakeFiles/dbcsr.dir/dbcsr_min_heap.mod.stamp GNU +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_toollib.mod src/CMakeFiles/dbcsr.dir/dbcsr_toollib.mod.stamp GNU +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_dict.mod src/CMakeFiles/dbcsr.dir/dbcsr_dict.mod.stamp GNU +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_iter_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_iter_types.mod.stamp GNU +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_list_callstackentry.mod src/CMakeFiles/dbcsr.dir/dbcsr_list_callstackentry.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_list_routinereport.mod src/CMakeFiles/dbcsr.dir/dbcsr_list_routinereport.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_print_messages.mod src/CMakeFiles/dbcsr.dir/dbcsr_print_messages.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_array_types.F.o.provides.build -[ 55%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_global.F.o -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_list_routinereport.F.o.provides.build -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_global.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_global.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_global.F.o -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_min_heap.mod src/CMakeFiles/dbcsr.dir/dbcsr_min_heap.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_print_messages.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/utils/dbcsr_btree.F.o.provides.build /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/utils/dbcsr_min_heap.F.o.provides.build -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_list_callstackentry.mod src/CMakeFiles/dbcsr.dir/dbcsr_list_callstackentry.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/utils/dbcsr_toollib.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/cuda/dbcsr_cuda_profiling.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_device.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_timings.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_array_types.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_dict.F.o.provides.build +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_files.mod src/CMakeFiles/dbcsr.dir/dbcsr_files.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_list_routinestat.mod src/CMakeFiles/dbcsr.dir/dbcsr_list_routinestat.mod.stamp GNU -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_btree.mod src/CMakeFiles/dbcsr.dir/dbcsr_btree.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_iter_types.F.o.provides.build /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_list_callstackentry.F.o.provides.build -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_dict.mod src/CMakeFiles/dbcsr.dir/dbcsr_dict.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_list_routinereport.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_print_messages.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/utils/dbcsr_files.F.o.provides.build /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_list_routinestat.F.o.provides.build -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/utils/dbcsr_btree.F.o.provides.build -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_dict.F.o.provides.build +[ 55%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_global.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_global.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_global.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_global.F.o [ 56%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_timings_types.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_timings_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings_types.F -o CMakeFiles/dbcsr.dir/core/dbcsr_timings_types.F.o -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_files.mod src/CMakeFiles/dbcsr.dir/dbcsr_files.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_timings_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_timings_types.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/utils/dbcsr_files.F.o.provides.build /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_timings_types.F.o.provides.build [ 56%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_list_timerenv.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_list_timerenv.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_list_timerenv.F -o CMakeFiles/dbcsr.dir/core/dbcsr_list_timerenv.F.o @@ -1074,54 +1110,54 @@ /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_config.F.o.provides.build [ 57%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_stream.F.o [ 57%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_init.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_init.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_init.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_init.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_stream.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_stream.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_stream.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_init.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_init.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_init.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_init.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_init.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_stream.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_stream.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_init.F.o.provides.build /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_stream.F.o.provides.build -[ 57%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_devmem.F.o [ 57%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_event.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_event.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_event.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_event.F.o [ 59%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_hostmem.F.o +[ 59%] Building Fortran object src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_devmem.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_devmem.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_devmem.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_devmem.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_event.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_event.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_event.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_hostmem.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/acc/dbcsr_acc_hostmem.F -o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_hostmem.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_event.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_event.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_event.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_devmem.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_devmem.mod.stamp GNU -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_hostmem.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_hostmem.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_devmem.F.o.provides.build -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_hostmem.F.o.provides.build -[ 59%] Building Fortran object src/CMakeFiles/dbcsr.dir/data/dbcsr_data_types.F.o +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_hostmem.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_hostmem.mod.stamp GNU [ 59%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_timings.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_data_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_data_types.F -o CMakeFiles/dbcsr.dir/data/dbcsr_data_types.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_timings.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings.F -o CMakeFiles/dbcsr.dir/core/dbcsr_timings.F.o +[ 59%] Building Fortran object src/CMakeFiles/dbcsr.dir/data/dbcsr_data_types.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_data_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_data_types.F -o CMakeFiles/dbcsr.dir/data/dbcsr_data_types.F.o +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/acc/dbcsr_acc_hostmem.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_data_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_data_types.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/data/dbcsr_data_types.F.o.provides.build [ 59%] Building Fortran object src/CMakeFiles/dbcsr.dir/data/dbcsr_ptr_util.F.o -[ 60%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_types.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_ptr_util.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_ptr_util.F -o CMakeFiles/dbcsr.dir/data/dbcsr_ptr_util.F.o +[ 60%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_types.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_types.F -o CMakeFiles/dbcsr.dir/core/dbcsr_types.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_timings.mod src/CMakeFiles/dbcsr.dir/dbcsr_timings.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_timings.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_types.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_types.F.o.provides.build -[ 60%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_blas_operations.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_blas_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_blas_operations.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_blas_operations.F.o -[ 60%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_types.F.o -[ 62%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_timings_report.F.o [ 62%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_acc_operations.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_timings_report.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings_report.F -o CMakeFiles/dbcsr.dir/core/dbcsr_timings_report.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_acc_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_acc_operations.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_acc_operations.F.o +[ 62%] Building Fortran object src/CMakeFiles/dbcsr.dir/utils/dbcsr_blas_operations.F.o +[ 62%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_timings_report.F.o +[ 62%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_types.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_blas_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/utils/dbcsr_blas_operations.F -o CMakeFiles/dbcsr.dir/utils/dbcsr_blas_operations.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_timings_report.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_timings_report.F -o CMakeFiles/dbcsr.dir/core/dbcsr_timings_report.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_types.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_types.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_blas_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_blas_operations.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_acc_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_acc_operations.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/utils/dbcsr_blas_operations.F.o.provides.build /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_acc_operations.F.o.provides.build -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_types.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_timings_report.mod src/CMakeFiles/dbcsr.dir/dbcsr_timings_report.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_types.F.o.provides.build +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_types.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_timings_report.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_types.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_ptr_util.mod src/CMakeFiles/dbcsr.dir/dbcsr_ptr_util.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/data/dbcsr_ptr_util.F.o.provides.build [ 63%] Building Fortran object src/CMakeFiles/dbcsr.dir/data/dbcsr_data_methods_low.F.o @@ -1130,8 +1166,8 @@ /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/data/dbcsr_data_methods_low.F.o.provides.build [ 65%] Building Fortran object src/CMakeFiles/dbcsr.dir/block/dbcsr_block_operations.F.o [ 65%] Building Fortran object src/CMakeFiles/dbcsr.dir/data/dbcsr_mem_methods.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_block_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_block_operations.F -o CMakeFiles/dbcsr.dir/block/dbcsr_block_operations.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mem_methods.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_mem_methods.F -o CMakeFiles/dbcsr.dir/data/dbcsr_mem_methods.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_block_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_block_operations.F -o CMakeFiles/dbcsr.dir/block/dbcsr_block_operations.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mem_methods.mod src/CMakeFiles/dbcsr.dir/dbcsr_mem_methods.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/data/dbcsr_mem_methods.F.o.provides.build [ 65%] Building Fortran object src/CMakeFiles/dbcsr.dir/data/dbcsr_data_methods.F.o @@ -1140,60 +1176,60 @@ /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/data/dbcsr_data_methods.F.o.provides.build [ 65%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_hostdrv.F.o [ 65%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_methods.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_hostdrv.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_hostdrv.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_hostdrv.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_methods.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_methods.F -o CMakeFiles/dbcsr.dir/core/dbcsr_methods.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_hostdrv.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_hostdrv.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_hostdrv.F.o +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_hostdrv.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_hostdrv.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_hostdrv.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_methods.mod src/CMakeFiles/dbcsr.dir/dbcsr_methods.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_methods.F.o.provides.build [ 65%] Building Fortran object src/CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_methods.F.o [ 65%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_log_handling.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mp_methods.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mpi/dbcsr_mp_methods.F -o CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_methods.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_log_handling.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_log_handling.F -o CMakeFiles/dbcsr.dir/core/dbcsr_log_handling.F.o -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_hostdrv.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_hostdrv.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_hostdrv.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mp_methods.mod src/CMakeFiles/dbcsr.dir/dbcsr_mp_methods.mod.stamp GNU -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_log_handling.mod src/CMakeFiles/dbcsr.dir/dbcsr_log_handling.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_methods.F.o.provides.build -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_log_handling.F.o.provides.build [ 66%] Building Fortran object src/CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_operations.F.o [ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/dist/dbcsr_dist_methods.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mp_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mpi/dbcsr_mp_operations.F -o CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_operations.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_dist_methods.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dist/dbcsr_dist_methods.F -o CMakeFiles/dbcsr.dir/dist/dbcsr_dist_methods.F.o +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_log_handling.mod src/CMakeFiles/dbcsr.dir/dbcsr_log_handling.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_log_handling.F.o.provides.build [ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/core/dbcsr_error_handling.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_error_handling.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/core/dbcsr_error_handling.F -o CMakeFiles/dbcsr.dir/core/dbcsr_error_handling.F.o +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_dist_methods.mod src/CMakeFiles/dbcsr.dir/dbcsr_dist_methods.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_block_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_block_operations.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/block/dbcsr_block_operations.F.o.provides.build -[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_accdrv.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_accdrv.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_accdrv.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_accdrv.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_error_handling.mod src/CMakeFiles/dbcsr.dir/dbcsr_error_handling.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_error_handling.F.o.provides.build -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_dist_methods.mod src/CMakeFiles/dbcsr.dir/dbcsr_dist_methods.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/dist/dbcsr_dist_methods.F.o.provides.build -[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/dist/dbcsr_dist_util.F.o -[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/dist/dbcsr_dist_operations.F.o +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/block/dbcsr_block_operations.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_error_handling.F.o.provides.build [ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/block/dbcsr_iterator_operations.F.o +[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/dist/dbcsr_dist_operations.F.o +[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/dist/dbcsr_dist_util.F.o +[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_accdrv.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_iterator_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_iterator_operations.F -o CMakeFiles/dbcsr.dir/block/dbcsr_iterator_operations.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_dist_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dist/dbcsr_dist_operations.F -o CMakeFiles/dbcsr.dir/dist/dbcsr_dist_operations.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_dist_util.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dist/dbcsr_dist_util.F -o CMakeFiles/dbcsr.dir/dist/dbcsr_dist_util.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_iterator_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_iterator_operations.F -o CMakeFiles/dbcsr.dir/block/dbcsr_iterator_operations.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_accdrv.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_accdrv.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_accdrv.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_accdrv.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_accdrv.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_accdrv.F.o.provides.build +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_iterator_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_iterator_operations.mod.stamp GNU [ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_sched.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_sched.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_sched.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_sched.F.o +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/block/dbcsr_iterator_operations.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_dist_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_dist_operations.mod.stamp GNU -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_iterator_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_iterator_operations.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/dist/dbcsr_dist_operations.F.o.provides.build -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/block/dbcsr_iterator_operations.F.o.provides.build -[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/block/dbcsr_index_operations.F.o [ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_dist_operations.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_index_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_index_operations.F -o CMakeFiles/dbcsr.dir/block/dbcsr_index_operations.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_dist_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_dist_operations.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_dist_operations.F.o +[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/block/dbcsr_index_operations.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_index_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_index_operations.F -o CMakeFiles/dbcsr.dir/block/dbcsr_index_operations.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_dist_util.mod src/CMakeFiles/dbcsr.dir/dbcsr_dist_util.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/dist/dbcsr_dist_util.F.o.provides.build [ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/data/dbcsr_data_operations.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_data_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/data/dbcsr_data_operations.F -o CMakeFiles/dbcsr.dir/data/dbcsr_data_operations.F.o -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mp_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_mp_operations.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_sched.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_sched.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_operations.F.o.provides.build +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mp_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_mp_operations.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_sched.F.o.provides.build +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_operations.F.o.provides.build [ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_csr.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_csr.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_csr.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_csr.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_data_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_data_operations.mod.stamp GNU @@ -1202,10 +1238,10 @@ /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_dist_operations.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_index_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_index_operations.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/block/dbcsr_index_operations.F.o.provides.build -[ 68%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_util.F.o [ 69%] Building Fortran object src/CMakeFiles/dbcsr.dir/work/dbcsr_work_operations.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_util.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_util.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_util.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_work_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/work/dbcsr_work_operations.F -o CMakeFiles/dbcsr.dir/work/dbcsr_work_operations.F.o +[ 69%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_util.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_util.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_util.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_util.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_csr.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_csr.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_csr.F.o.provides.build [ 69%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_multrec.F.o @@ -1214,15 +1250,15 @@ /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_util.F.o.provides.build [ 69%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_split.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_split.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_split.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_split.F.o -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_multrec.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_multrec.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_multrec.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_split.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_split.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_split.F.o.provides.build +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_multrec.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_multrec.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_multrec.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_work_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_work_operations.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/work/dbcsr_work_operations.F.o.provides.build [ 69%] Building Fortran object src/CMakeFiles/dbcsr.dir/block/dbcsr_block_access.F.o -[ 71%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_common.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_block_access.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/block/dbcsr_block_access.F -o CMakeFiles/dbcsr.dir/block/dbcsr_block_access.F.o +[ 71%] Building Fortran object src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_common.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_mm_common.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/mm/dbcsr_mm_common.F -o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_common.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_mm_common.mod src/CMakeFiles/dbcsr.dir/dbcsr_mm_common.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_mm_common.F.o.provides.build @@ -1231,8 +1267,8 @@ /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_block_access.mod src/CMakeFiles/dbcsr.dir/dbcsr_block_access.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/block/dbcsr_block_access.F.o.provides.build [ 72%] Building Fortran object src/CMakeFiles/dbcsr.dir/ops/dbcsr_operations.F.o -[ 72%] Building Fortran object src/CMakeFiles/dbcsr.dir/ops/dbcsr_test_methods.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_operations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_operations.F -o CMakeFiles/dbcsr.dir/ops/dbcsr_operations.F.o +[ 72%] Building Fortran object src/CMakeFiles/dbcsr.dir/ops/dbcsr_test_methods.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_test_methods.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_test_methods.F -o CMakeFiles/dbcsr.dir/ops/dbcsr_test_methods.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_test_methods.mod src/CMakeFiles/dbcsr.dir/dbcsr_test_methods.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/ops/dbcsr_test_methods.F.o.provides.build @@ -1241,8 +1277,8 @@ /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_operations.mod src/CMakeFiles/dbcsr.dir/dbcsr_operations.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/ops/dbcsr_operations.F.o.provides.build [ 73%] Building Fortran object src/CMakeFiles/dbcsr.dir/ops/dbcsr_transformations.F.o -[ 73%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_base.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_transformations.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_transformations.F -o CMakeFiles/dbcsr.dir/ops/dbcsr_transformations.F.o +[ 73%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_base.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_base.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_base.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_base.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_base.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_base.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_base.F.o.provides.build @@ -1252,14 +1288,14 @@ cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_reshape_ops.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_reshape_ops.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_reshape_ops.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_io.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_io.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_io.F.o.provides.build +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_reshape_ops.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_reshape_ops.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_reshape_ops.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_transformations.mod src/CMakeFiles/dbcsr.dir/dbcsr_transformations.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/ops/dbcsr_transformations.F.o.provides.build -[ 73%] Building Fortran object src/CMakeFiles/dbcsr.dir/ops/dbcsr_io.F.o [ 73%] Building Fortran object src/CMakeFiles/dbcsr.dir/ops/dbcsr_csr_conversions.F.o +[ 73%] Building Fortran object src/CMakeFiles/dbcsr.dir/ops/dbcsr_io.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_io.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_io.F -o CMakeFiles/dbcsr.dir/ops/dbcsr_io.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_csr_conversions.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_csr_conversions.F -o CMakeFiles/dbcsr.dir/ops/dbcsr_csr_conversions.F.o -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_reshape_ops.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_reshape_ops.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_reshape_ops.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_io.mod src/CMakeFiles/dbcsr.dir/dbcsr_io.mod.stamp GNU /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_csr_conversions.mod src/CMakeFiles/dbcsr.dir/dbcsr_csr_conversions.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/ops/dbcsr_io.F.o.provides.build @@ -1279,8 +1315,8 @@ /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_multiply_api.mod src/CMakeFiles/dbcsr.dir/dbcsr_multiply_api.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/mm/dbcsr_multiply_api.F.o.provides.build [ 75%] Building Fortran object src/CMakeFiles/dbcsr.dir/ops/dbcsr_tests.F.o -[ 76%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_mm.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tests.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/ops/dbcsr_tests.F -o CMakeFiles/dbcsr.dir/ops/dbcsr_tests.F.o +[ 76%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_mm.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_mm.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_mm.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_mm.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_lib.mod src/CMakeFiles/dbcsr.dir/dbcsr_lib.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/core/dbcsr_lib.F.o.provides.build @@ -1288,14 +1324,14 @@ /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/ops/dbcsr_tests.F.o.provides.build [ 76%] Building Fortran object src/CMakeFiles/dbcsr.dir/dbcsr_api.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_api.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dbcsr_api.F -o CMakeFiles/dbcsr.dir/dbcsr_api.F.o +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_api.mod src/CMakeFiles/dbcsr.dir/dbcsr_api.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/dbcsr_api.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_mm.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_mm.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_mm.F.o.provides.build +[ 76%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_types.F.o [ 78%] Building Fortran object src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_test.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_test.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_test.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_test.F.o -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_api.mod src/CMakeFiles/dbcsr.dir/dbcsr_api.mod.stamp GNU -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/dbcsr_api.F.o.provides.build -[ 78%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_types.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tensor_types.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_types.F -o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_types.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tas_test.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tas/dbcsr_tas_test.F -o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_test.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tas_test.mod src/CMakeFiles/dbcsr.dir/dbcsr_tas_test.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tas/dbcsr_tas_test.F.o.provides.build /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tensor_types.mod src/CMakeFiles/dbcsr.dir/dbcsr_tensor_types.mod.stamp GNU @@ -1307,8 +1343,8 @@ [ 78%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_io.F.o [ 79%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_reshape.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tensor_io.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_io.F -o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_io.F.o -[ 79%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_split.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tensor_reshape.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_reshape.F -o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_reshape.F.o +[ 79%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_split.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tensor_split.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_split.F -o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_split.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tensor_io.mod src/CMakeFiles/dbcsr.dir/dbcsr_tensor_io.mod.stamp GNU /usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_io.F.o.provides.build @@ -1327,9 +1363,9 @@ [ 81%] Building Fortran object src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_api.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -D__STATM_TOTAL -D__parallel -D__SHORT_FILE__=\"dbcsr_tensor_api.F\" -I/build/reproducible-path/dbcsr-2.6.0/src/base -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_api.F -o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_api.F.o /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tensor_api.mod src/CMakeFiles/dbcsr.dir/dbcsr_tensor_api.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_api.F.o.provides.build [ 81%] Linking Fortran static library libdbcsr.a cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/cmake -P CMakeFiles/dbcsr.dir/cmake_clean_target.cmake -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_api.F.o.provides.build cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr.dir/link.txt --verbose=1 /usr/bin/ar qc libdbcsr.a CMakeFiles/dbcsr.dir/dbcsr_api.F.o CMakeFiles/dbcsr.dir/acc/cuda/dbcsr_cuda_profiling.F.o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_device.F.o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_devmem.F.o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_event.F.o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_hostmem.F.o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_init.F.o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_stream.F.o CMakeFiles/dbcsr.dir/acc/dbcsr_acc_timings.F.o CMakeFiles/dbcsr.dir/acc/hip/dbcsr_hip_profiling.F.o CMakeFiles/dbcsr.dir/base/dbcsr_base_hooks.F.o CMakeFiles/dbcsr.dir/base/dbcsr_kinds.F.o CMakeFiles/dbcsr.dir/base/dbcsr_machine.F.o CMakeFiles/dbcsr.dir/base/dbcsr_machine_internal.F.o CMakeFiles/dbcsr.dir/block/dbcsr_block_access.F.o CMakeFiles/dbcsr.dir/block/dbcsr_block_operations.F.o CMakeFiles/dbcsr.dir/block/dbcsr_index_operations.F.o CMakeFiles/dbcsr.dir/block/dbcsr_iterator_operations.F.o CMakeFiles/dbcsr.dir/core/dbcsr_array_types.F.o CMakeFiles/dbcsr.dir/core/dbcsr_config.F.o CMakeFiles/dbcsr.dir/core/dbcsr_lib.F.o CMakeFiles/dbcsr.dir/core/dbcsr_methods.F.o CMakeFiles/dbcsr.dir/core/dbcsr_types.F.o CMakeFiles/dbcsr.dir/core/dbcsr_dict.F.o CMakeFiles/dbcsr.dir/core/dbcsr_error_handling.F.o CMakeFiles/dbcsr.dir/core/dbcsr_iter_types.F.o CMakeFiles/dbcsr.dir/core/dbcsr_list_callstackentry.F.o CMakeFiles/dbcsr.dir/core/dbcsr_list.F.o CMakeFiles/dbcsr.dir/core/dbcsr_list_routinereport.F.o CMakeFiles/dbcsr.dir/core/dbcsr_list_routinestat.F.o CMakeFiles/dbcsr.dir/core/dbcsr_list_timerenv.F.o CMakeFiles/dbcsr.dir/core/dbcsr_log_handling.F.o CMakeFiles/dbcsr.dir/core/dbcsr_print_messages.F.o CMakeFiles/dbcsr.dir/core/dbcsr_timings_base_type.F.o CMakeFiles/dbcsr.dir/core/dbcsr_timings.F.o CMakeFiles/dbcsr.dir/core/dbcsr_timings_report.F.o CMakeFiles/dbcsr.dir/core/dbcsr_timings_types.F.o CMakeFiles/dbcsr.dir/data/dbcsr_data_operations.F.o CMakeFiles/dbcsr.dir/data/dbcsr_data_methods.F.o CMakeFiles/dbcsr.dir/data/dbcsr_data_methods_low.F.o CMakeFiles/dbcsr.dir/data/dbcsr_data_types.F.o CMakeFiles/dbcsr.dir/data/dbcsr_mem_methods.F.o CMakeFiles/dbcsr.dir/data/dbcsr_ptr_util.F.o CMakeFiles/dbcsr.dir/dist/dbcsr_dist_methods.F.o CMakeFiles/dbcsr.dir/dist/dbcsr_dist_operations.F.o CMakeFiles/dbcsr.dir/dist/dbcsr_dist_util.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_acc_operations.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_3d.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_accdrv.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_cannon.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_common.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_csr.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_dist_operations.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_hostdrv.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_multrec.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_sched.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_mm_types.F.o CMakeFiles/dbcsr.dir/mm/dbcsr_multiply_api.F.o CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_methods.F.o CMakeFiles/dbcsr.dir/mpi/dbcsr_mp_operations.F.o CMakeFiles/dbcsr.dir/mpi/dbcsr_mpiwrap.F.o CMakeFiles/dbcsr.dir/ops/dbcsr_csr_conversions.F.o CMakeFiles/dbcsr.dir/ops/dbcsr_io.F.o CMakeFiles/dbcsr.dir/ops/dbcsr_operations.F.o CMakeFiles/dbcsr.dir/ops/dbcsr_test_methods.F.o CMakeFiles/dbcsr.dir/ops/dbcsr_tests.F.o CMakeFiles/dbcsr.dir/ops/dbcsr_transformations.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_base.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_global.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_io.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_mm.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_reshape_ops.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_split.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_test.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_types.F.o CMakeFiles/dbcsr.dir/tas/dbcsr_tas_util.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_allocate_wrap.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_array_list_methods.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_api.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_block.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_index.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_io.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_reshape.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_split.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_test.F.o CMakeFiles/dbcsr.dir/tensors/dbcsr_tensor_types.F.o CMakeFiles/dbcsr.dir/utils/dbcsr_array_sort.F.o CMakeFiles/dbcsr.dir/utils/dbcsr_blas_operations.F.o CMakeFiles/dbcsr.dir/utils/dbcsr_btree.F.o CMakeFiles/dbcsr.dir/utils/dbcsr_files.F.o CMakeFiles/dbcsr.dir/utils/dbcsr_min_heap.F.o CMakeFiles/dbcsr.dir/utils/dbcsr_string_utilities.F.o CMakeFiles/dbcsr.dir/utils/dbcsr_toollib.F.o CMakeFiles/dbcsr.dir/work/dbcsr_work_operations.F.o /usr/bin/ranlib libdbcsr.a @@ -1339,252 +1375,252 @@ make -f tests/CMakeFiles/dbcsr_perf.dir/build.make tests/CMakeFiles/dbcsr_perf.dir/depend make -f tests/CMakeFiles/dbcsr_unittest_common.dir/build.make tests/CMakeFiles/dbcsr_unittest_common.dir/depend make -f examples/CMakeFiles/dbcsr_example_1.dir/build.make examples/CMakeFiles/dbcsr_example_1.dir/depend -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make -f examples/CMakeFiles/dbcsr_example_2.dir/build.make examples/CMakeFiles/dbcsr_example_2.dir/depend +make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make -f examples/CMakeFiles/dbcsr_example_3.dir/build.make examples/CMakeFiles/dbcsr_example_3.dir/depend make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_perf.dir/DependInfo.cmake "--color=" make -f examples/CMakeFiles/dbcsr_tensor_example_1.dir/build.make examples/CMakeFiles/dbcsr_tensor_example_1.dir/depend make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/DependInfo.cmake "--color=" make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_1.dir/DependInfo.cmake "--color=" +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/DependInfo.cmake "--color=" make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_2.dir/DependInfo.cmake "--color=" make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_3.dir/DependInfo.cmake "--color=" make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_1.dir/DependInfo.cmake "--color=" -[ 81%] Generating dbcsr.h -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/depend.internal". -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_perf.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_perf.dir/depend.internal". -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_perf.dir/depend.internal". -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/depend.internal". -[ 81%] Generating tensors/dbcsr_tensor_api_c.F -[ 81%] Generating tensors/dbcsr_tensor.h Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_1.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_1.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_1.dir/depend.internal". +[ 82%] Generating tensors/dbcsr_tensor_api_c.F [ 82%] Generating dbcsr_api_c.F -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp -F /build/reproducible-path/dbcsr-2.6.0/src/dbcsr.h /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dbcsr.h Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_2.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_2.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_2.dir/depend.internal". +Scanning dependencies of target dbcsr_example_1 +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/dbcsr_api_c.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dbcsr_api_c.F +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/depend.internal". +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/depend.internal". +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_perf.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_perf.dir/depend.internal". +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_perf.dir/depend.internal". +[ 82%] Generating tensors/dbcsr_tensor.h +Scanning dependencies of target dbcsr_example_2 cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor_api_c.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_api_c.F +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_1.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_1.dir/depend.internal". +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_1.dir/depend.internal". +[ 82%] Generating dbcsr.h +make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp -F /build/reproducible-path/dbcsr-2.6.0/src/tensors/dbcsr_tensor.h /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor.h +make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_3.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_3.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_3.dir/depend.internal". -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp /build/reproducible-path/dbcsr-2.6.0/src/dbcsr_api_c.F /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dbcsr_api_c.F -Scanning dependencies of target dbcsr_example_1 -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_1.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_1.dir/depend.internal". -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_1.dir/depend.internal". -Scanning dependencies of target dbcsr_example_2 +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/python3 /usr/bin/fypp -F /build/reproducible-path/dbcsr-2.6.0/src/dbcsr.h /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dbcsr.h Scanning dependencies of target dbcsr_perf -Scanning dependencies of target dbcsr_example_3 -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f examples/CMakeFiles/dbcsr_example_1.dir/build.make examples/CMakeFiles/dbcsr_example_1.dir/build Scanning dependencies of target dbcsr_unittest_common -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +make -f examples/CMakeFiles/dbcsr_example_1.dir/build.make examples/CMakeFiles/dbcsr_example_1.dir/build Scanning dependencies of target dbcsr_tensor_example_1 make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make -f examples/CMakeFiles/dbcsr_example_2.dir/build.make examples/CMakeFiles/dbcsr_example_2.dir/build +make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make -f tests/CMakeFiles/dbcsr_perf.dir/build.make tests/CMakeFiles/dbcsr_perf.dir/build make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make -f tests/CMakeFiles/dbcsr_unittest_common.dir/build.make tests/CMakeFiles/dbcsr_unittest_common.dir/build make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f examples/CMakeFiles/dbcsr_example_3.dir/build.make examples/CMakeFiles/dbcsr_example_3.dir/build make -f examples/CMakeFiles/dbcsr_tensor_example_1.dir/build.make examples/CMakeFiles/dbcsr_tensor_example_1.dir/build make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +Scanning dependencies of target dbcsr_example_3 +make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +make -f examples/CMakeFiles/dbcsr_example_3.dir/build.make examples/CMakeFiles/dbcsr_example_3.dir/build make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 82%] Building Fortran object examples/CMakeFiles/dbcsr_example_2.dir/dbcsr_example_2.F.o +[ 82%] Building Fortran object tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_add.F.o [ 82%] Building Fortran object examples/CMakeFiles/dbcsr_example_1.dir/dbcsr_example_1.F.o +[ 82%] Building Fortran object examples/CMakeFiles/dbcsr_tensor_example_1.dir/dbcsr_tensor_example_1.F.o [ 82%] Building Fortran object tests/CMakeFiles/dbcsr_perf.dir/dbcsr_performance_multiply.F.o -[ 82%] Building Fortran object tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_add.F.o -[ 84%] Building Fortran object examples/CMakeFiles/dbcsr_example_3.dir/dbcsr_example_3.F.o -[ 84%] Building Fortran object tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_multiply.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_example_1.F -o CMakeFiles/dbcsr_example_1.dir/dbcsr_example_1.F.o +[ 82%] Building Fortran object examples/CMakeFiles/dbcsr_example_2.dir/dbcsr_example_2.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_example_2.F -o CMakeFiles/dbcsr_example_2.dir/dbcsr_example_2.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_performance_multiply.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_performance_multiply.F -o CMakeFiles/dbcsr_perf.dir/dbcsr_performance_multiply.F.o -[ 84%] Building Fortran object examples/CMakeFiles/dbcsr_tensor_example_1.dir/dbcsr_tensor_example_1.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_example_1.F -o CMakeFiles/dbcsr_example_1.dir/dbcsr_example_1.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_test_add.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_test_add.F -o CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_add.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -Wno-error -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_tensor_example_1.F -o CMakeFiles/dbcsr_tensor_example_1.dir/dbcsr_tensor_example_1.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_performance_multiply.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_performance_multiply.F -o CMakeFiles/dbcsr_perf.dir/dbcsr_performance_multiply.F.o +[ 84%] Building Fortran object examples/CMakeFiles/dbcsr_example_3.dir/dbcsr_example_3.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_example_3.F -o CMakeFiles/dbcsr_example_3.dir/dbcsr_example_3.F.o +[ 84%] Building Fortran object tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_multiply.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_test_multiply.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_test_multiply.F -o CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_multiply.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -Wno-error -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_tensor_example_1.F -o CMakeFiles/dbcsr_tensor_example_1.dir/dbcsr_tensor_example_1.F.o [ 85%] Linking Fortran executable dbcsr_example_1 cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_example_1.dir/link.txt --verbose=1 [ 85%] Linking Fortran executable dbcsr_example_2 cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_example_2.dir/link.txt --verbose=1 [ 85%] Linking Fortran executable dbcsr_example_3 -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_example_3.dir/link.txt --verbose=1 cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/src /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/CMakeFiles/dbcsr_c.dir/DependInfo.cmake "--color=" +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_example_3.dir/link.txt --verbose=1 Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/CMakeFiles/dbcsr_c.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/CMakeFiles/dbcsr_c.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/CMakeFiles/dbcsr_c.dir/depend.internal". Scanning dependencies of target dbcsr_c +/usr/bin/cmake -E cmake_copy_f90_mod tests/dbcsr_test_add.mod tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_add.mod.stamp GNU make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make -f src/CMakeFiles/dbcsr_c.dir/build.make src/CMakeFiles/dbcsr_c.dir/build make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -/usr/bin/cmake -E cmake_copy_f90_mod tests/dbcsr_test_add.mod tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_add.mod.stamp GNU [ 85%] Building Fortran object src/CMakeFiles/dbcsr_c.dir/dbcsr_api_c.F.o -[ 86%] Building Fortran object src/CMakeFiles/dbcsr_c.dir/tensors/dbcsr_tensor_api_c.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_api_c.F -o CMakeFiles/dbcsr_c.dir/tensors/dbcsr_tensor_api_c.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/dbcsr_api_c.F -o CMakeFiles/dbcsr_c.dir/dbcsr_api_c.F.o /usr/bin/cmake -E touch tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_add.F.o.provides.build -/usr/bin/cmake -E cmake_copy_f90_mod tests/dbcsr_test_multiply.mod tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_multiply.mod.stamp GNU -[ 88%] Linking Fortran static library libdbcsr_unittest_common.a -/usr/bin/cmake -E touch tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_multiply.F.o.provides.build -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -P CMakeFiles/dbcsr_unittest_common.dir/cmake_clean_target.cmake -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_unittest_common.dir/link.txt --verbose=1 -/usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_example_2.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_example_2.dir/dbcsr_example_2.F.o -o dbcsr_example_2 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a +[ 86%] Building Fortran object src/CMakeFiles/dbcsr_c.dir/tensors/dbcsr_tensor_api_c.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/gfortran -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fPIC -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/tensors/dbcsr_tensor_api_c.F -o CMakeFiles/dbcsr_c.dir/tensors/dbcsr_tensor_api_c.F.o /usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_example_1.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_example_1.dir/dbcsr_example_1.F.o -o dbcsr_example_1 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +/usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_example_2.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_example_2.dir/dbcsr_example_2.F.o -o dbcsr_example_2 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +[ 86%] Built target dbcsr_example_1 +/usr/bin/cmake -E cmake_copy_f90_mod tests/dbcsr_test_multiply.mod tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_multiply.mod.stamp GNU +[ 86%] Built target dbcsr_example_2 /usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_example_3.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_example_3.dir/dbcsr_example_3.F.o -o dbcsr_example_3 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 88%] Built target dbcsr_example_1 -[ 88%] Built target dbcsr_example_2 +/usr/bin/cmake -E touch tests/CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_multiply.F.o.provides.build +[ 88%] Linking Fortran static library libdbcsr_unittest_common.a +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -P CMakeFiles/dbcsr_unittest_common.dir/cmake_clean_target.cmake +[ 88%] Built target dbcsr_example_3 +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_unittest_common.dir/link.txt --verbose=1 +/usr/bin/cmake -E cmake_copy_f90_mod tests/dbcsr_performance_multiply.mod tests/CMakeFiles/dbcsr_perf.dir/dbcsr_performance_multiply.mod.stamp GNU /usr/bin/ar qc libdbcsr_unittest_common.a CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_add.F.o CMakeFiles/dbcsr_unittest_common.dir/dbcsr_test_multiply.F.o /usr/bin/ranlib libdbcsr_unittest_common.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 88%] Built target dbcsr_example_3 [ 88%] Built target dbcsr_unittest_common +/usr/bin/cmake -E touch tests/CMakeFiles/dbcsr_perf.dir/dbcsr_performance_multiply.F.o.provides.build make -f tests/CMakeFiles/dbcsr_unittest1.dir/build.make tests/CMakeFiles/dbcsr_unittest1.dir/depend make -f tests/CMakeFiles/dbcsr_unittest2.dir/build.make tests/CMakeFiles/dbcsr_unittest2.dir/depend make -f tests/CMakeFiles/dbcsr_unittest3.dir/build.make tests/CMakeFiles/dbcsr_unittest3.dir/depend make -f tests/CMakeFiles/dbcsr_unittest4.dir/build.make tests/CMakeFiles/dbcsr_unittest4.dir/depend -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make -f tests/CMakeFiles/dbcsr_tensor_unittest.dir/build.make tests/CMakeFiles/dbcsr_tensor_unittest.dir/depend +make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest1.dir/DependInfo.cmake "--color=" make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest2.dir/DependInfo.cmake "--color=" -make -f tests/CMakeFiles/dbcsr_tas_unittest.dir/build.make tests/CMakeFiles/dbcsr_tas_unittest.dir/depend make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest3.dir/DependInfo.cmake "--color=" -make -f tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build.make tests/CMakeFiles/dbcsr_test_csr_conversions.dir/depend make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest4.dir/DependInfo.cmake "--color=" make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tensor_unittest.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/DependInfo.cmake "--color=" -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest3.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest3.dir/depend.internal". +make -f tests/CMakeFiles/dbcsr_tas_unittest.dir/build.make tests/CMakeFiles/dbcsr_tas_unittest.dir/depend +[ 89%] Building Fortran object tests/CMakeFiles/dbcsr_perf.dir/dbcsr_performance_driver.F.o Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest2.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest2.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest1.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest1.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest1.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest2.dir/depend.internal". +make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/DependInfo.cmake "--color=" +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest3.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest3.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest3.dir/depend.internal". +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_performance_driver.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_performance_driver.F -o CMakeFiles/dbcsr_perf.dir/dbcsr_performance_driver.F.o Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest4.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest4.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest4.dir/depend.internal". -Scanning dependencies of target dbcsr_unittest2 -Scanning dependencies of target dbcsr_unittest3 -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/depend.internal". -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tensor_unittest.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tensor_unittest.dir/depend.internal". Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tensor_unittest.dir/depend.internal". -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/depend.internal". -Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/depend.internal". +Scanning dependencies of target dbcsr_unittest3 +Scanning dependencies of target dbcsr_unittest2 Scanning dependencies of target dbcsr_unittest1 +Scanning dependencies of target dbcsr_tensor_unittest Scanning dependencies of target dbcsr_unittest4 make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -Scanning dependencies of target dbcsr_test_csr_conversions -make -f tests/CMakeFiles/dbcsr_unittest3.dir/build.make tests/CMakeFiles/dbcsr_unittest3.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -Scanning dependencies of target dbcsr_tas_unittest make -f tests/CMakeFiles/dbcsr_unittest2.dir/build.make tests/CMakeFiles/dbcsr_unittest2.dir/build -make -f tests/CMakeFiles/dbcsr_unittest1.dir/build.make tests/CMakeFiles/dbcsr_unittest1.dir/build make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_unittest4.dir/build.make tests/CMakeFiles/dbcsr_unittest4.dir/build -Scanning dependencies of target dbcsr_tensor_unittest make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build.make tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_tas_unittest.dir/build.make tests/CMakeFiles/dbcsr_tas_unittest.dir/build -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +make -f tests/CMakeFiles/dbcsr_unittest1.dir/build.make tests/CMakeFiles/dbcsr_unittest1.dir/build +make -f tests/CMakeFiles/dbcsr_unittest3.dir/build.make tests/CMakeFiles/dbcsr_unittest3.dir/build +make -f tests/CMakeFiles/dbcsr_unittest4.dir/build.make tests/CMakeFiles/dbcsr_unittest4.dir/build make -f tests/CMakeFiles/dbcsr_tensor_unittest.dir/build.make tests/CMakeFiles/dbcsr_tensor_unittest.dir/build make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 91%] Building Fortran object tests/CMakeFiles/dbcsr_unittest2.dir/dbcsr_unittest2.F.o +make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/depend.internal". +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/depend.internal". +Scanning dependencies of target dbcsr_tas_unittest +make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +[ 89%] Building Fortran object tests/CMakeFiles/dbcsr_unittest2.dir/dbcsr_unittest2.F.o +make -f tests/CMakeFiles/dbcsr_tas_unittest.dir/build.make tests/CMakeFiles/dbcsr_tas_unittest.dir/build [ 91%] Building Fortran object tests/CMakeFiles/dbcsr_unittest1.dir/dbcsr_unittest1.F.o -[ 91%] Building Fortran object tests/CMakeFiles/dbcsr_test_csr_conversions.dir/dbcsr_test_csr_conversions.F.o -[ 91%] Building Fortran object tests/CMakeFiles/dbcsr_unittest3.dir/dbcsr_unittest3.F.o -[ 92%] Building Fortran object tests/CMakeFiles/dbcsr_unittest4.dir/dbcsr_test_scale_by_vector.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_test_csr_conversions.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_test_csr_conversions.F -o CMakeFiles/dbcsr_test_csr_conversions.dir/dbcsr_test_csr_conversions.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_unittest2.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_unittest2.F -o CMakeFiles/dbcsr_unittest2.dir/dbcsr_unittest2.F.o +[ 92%] Building Fortran object tests/CMakeFiles/dbcsr_unittest3.dir/dbcsr_unittest3.F.o +make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +[ 94%] Building Fortran object tests/CMakeFiles/dbcsr_tensor_unittest.dir/dbcsr_tensor_unittest.F.o +[ 94%] Building Fortran object tests/CMakeFiles/dbcsr_unittest4.dir/dbcsr_test_scale_by_vector.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_unittest1.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_unittest1.F -o CMakeFiles/dbcsr_unittest1.dir/dbcsr_unittest1.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_unittest3.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_unittest3.F -o CMakeFiles/dbcsr_unittest3.dir/dbcsr_unittest3.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_unittest2.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_unittest2.F -o CMakeFiles/dbcsr_unittest2.dir/dbcsr_unittest2.F.o -[ 94%] Building Fortran object tests/CMakeFiles/dbcsr_tas_unittest.dir/dbcsr_tas_unittest.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_test_scale_by_vector.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_test_scale_by_vector.F -o CMakeFiles/dbcsr_unittest4.dir/dbcsr_test_scale_by_vector.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_tas_unittest.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_tas_unittest.F -o CMakeFiles/dbcsr_tas_unittest.dir/dbcsr_tas_unittest.F.o -/usr/bin/cmake -E cmake_copy_f90_mod tests/dbcsr_performance_multiply.mod tests/CMakeFiles/dbcsr_perf.dir/dbcsr_performance_multiply.mod.stamp GNU -[ 94%] Building Fortran object tests/CMakeFiles/dbcsr_tensor_unittest.dir/dbcsr_tensor_unittest.F.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_tensor_unittest.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_tensor_unittest.F -o CMakeFiles/dbcsr_tensor_unittest.dir/dbcsr_tensor_unittest.F.o -/usr/bin/cmake -E touch tests/CMakeFiles/dbcsr_perf.dir/dbcsr_performance_multiply.F.o.provides.build -[ 95%] Building Fortran object tests/CMakeFiles/dbcsr_perf.dir/dbcsr_performance_driver.F.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_performance_driver.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fallow-invalid-boz -fallow-argument-mismatch -fopenmp -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_performance_driver.F -o CMakeFiles/dbcsr_perf.dir/dbcsr_performance_driver.F.o +[ 95%] Building Fortran object tests/CMakeFiles/dbcsr_tas_unittest.dir/dbcsr_tas_unittest.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_tas_unittest.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_tas_unittest.F -o CMakeFiles/dbcsr_tas_unittest.dir/dbcsr_tas_unittest.F.o [ 95%] Linking Fortran executable dbcsr_tensor_example_1 cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_tensor_example_1.dir/link.txt --verbose=1 +[ 95%] Linking Fortran executable dbcsr_perf +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_perf.dir/link.txt --verbose=1 [ 95%] Linking Fortran executable dbcsr_unittest2 cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_unittest2.dir/link.txt --verbose=1 [ 95%] Linking Fortran executable dbcsr_unittest3 cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_unittest3.dir/link.txt --verbose=1 -[ 95%] Linking Fortran executable dbcsr_test_csr_conversions -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_test_csr_conversions.dir/link.txt --verbose=1 -[ 95%] Linking Fortran executable dbcsr_perf -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_perf.dir/link.txt --verbose=1 -[ 95%] Linking Fortran executable dbcsr_unittest1 -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_unittest1.dir/link.txt --verbose=1 -[ 95%] Linking Fortran executable dbcsr_tas_unittest -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_tas_unittest.dir/link.txt --verbose=1 /usr/bin/cmake -E cmake_copy_f90_mod tests/dbcsr_test_scale_by_vector.mod tests/CMakeFiles/dbcsr_unittest4.dir/dbcsr_test_scale_by_vector.mod.stamp GNU /usr/bin/cmake -E touch tests/CMakeFiles/dbcsr_unittest4.dir/dbcsr_test_scale_by_vector.F.o.provides.build +make -f tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build.make tests/CMakeFiles/dbcsr_test_csr_conversions.dir/depend +make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/DependInfo.cmake "--color=" +[ 95%] Linking Fortran executable dbcsr_unittest1 +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_unittest1.dir/link.txt --verbose=1 [ 95%] Building Fortran object tests/CMakeFiles/dbcsr_unittest4.dir/dbcsr_unittest4.F.o +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/DependInfo.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/depend.internal". +Dependee "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/CMakeDirectoryInformation.cmake" is newer than depender "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/depend.internal". +Scanning dependencies of target dbcsr_test_csr_conversions cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_unittest4.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_unittest4.F -o CMakeFiles/dbcsr_unittest4.dir/dbcsr_unittest4.F.o -/usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_unittest2.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_unittest2.dir/dbcsr_unittest2.F.o -o dbcsr_unittest2 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -/usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_unittest3.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_unittest3.dir/dbcsr_unittest3.F.o -o dbcsr_unittest3 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 95%] Built target dbcsr_unittest2 -[ 95%] Built target dbcsr_unittest3 -/usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_test_csr_conversions.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_test_csr_conversions.dir/dbcsr_test_csr_conversions.F.o -o dbcsr_test_csr_conversions -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a +make -f tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build.make tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build +make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +[ 95%] Linking Fortran executable dbcsr_tas_unittest +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_tas_unittest.dir/link.txt --verbose=1 +[ 95%] Building Fortran object tests/CMakeFiles/dbcsr_test_csr_conversions.dir/dbcsr_test_csr_conversions.F.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/gfortran -D__SHORT_FILE__=\"dbcsr_test_csr_conversions.F\" -I/build/reproducible-path/dbcsr-2.6.0/src -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/usr/lib/i386-linux-gnu/mpich/include -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch -fopenmp -fallow-invalid-boz -fallow-argument-mismatch -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_test_csr_conversions.F -o CMakeFiles/dbcsr_test_csr_conversions.dir/dbcsr_test_csr_conversions.F.o /usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_tensor_example_1.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_tensor_example_1.dir/dbcsr_tensor_example_1.F.o -o dbcsr_tensor_example_1 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 95%] Built target dbcsr_test_csr_conversions [ 95%] Built target dbcsr_tensor_example_1 +/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_api_c.mod src/CMakeFiles/dbcsr_c.dir/dbcsr_api_c.mod.stamp GNU +/usr/bin/cmake -E touch src/CMakeFiles/dbcsr_c.dir/dbcsr_api_c.F.o.provides.build /usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_perf.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_perf.dir/dbcsr_performance_driver.F.o CMakeFiles/dbcsr_perf.dir/dbcsr_performance_multiply.F.o -o dbcsr_perf -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' [ 95%] Built target dbcsr_perf -/usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_api_c.mod src/CMakeFiles/dbcsr_c.dir/dbcsr_api_c.mod.stamp GNU +/usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_unittest2.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_unittest2.dir/dbcsr_unittest2.F.o -o dbcsr_unittest2 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a +make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +/usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_unittest3.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_unittest3.dir/dbcsr_unittest3.F.o -o dbcsr_unittest3 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a +make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +[ 95%] Linking Fortran executable dbcsr_unittest4 +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_unittest4.dir/link.txt --verbose=1 +[ 95%] Built target dbcsr_unittest2 +[ 95%] Built target dbcsr_unittest3 +[ 95%] Linking Fortran executable dbcsr_test_csr_conversions +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_test_csr_conversions.dir/link.txt --verbose=1 /usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_unittest1.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_unittest1.dir/dbcsr_unittest1.F.o -o dbcsr_unittest1 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +[ 95%] Built target dbcsr_unittest1 /usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_tas_unittest.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_tas_unittest.dir/dbcsr_tas_unittest.F.o -o dbcsr_tas_unittest -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a -/usr/bin/cmake -E touch src/CMakeFiles/dbcsr_c.dir/dbcsr_api_c.F.o.provides.build make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 95%] Built target dbcsr_unittest1 [ 95%] Built target dbcsr_tas_unittest -[ 95%] Linking Fortran executable dbcsr_unittest4 -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_unittest4.dir/link.txt --verbose=1 -[ 95%] Linking Fortran executable dbcsr_tensor_unittest -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_tensor_unittest.dir/link.txt --verbose=1 /usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_unittest4.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_unittest4.dir/dbcsr_unittest4.F.o CMakeFiles/dbcsr_unittest4.dir/dbcsr_test_scale_by_vector.F.o -o dbcsr_unittest4 -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +/usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_test_csr_conversions.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_test_csr_conversions.dir/dbcsr_test_csr_conversions.F.o -o dbcsr_test_csr_conversions -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a +make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' [ 95%] Built target dbcsr_unittest4 +[ 95%] Built target dbcsr_test_csr_conversions +[ 95%] Linking Fortran executable dbcsr_tensor_unittest +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_tensor_unittest.dir/link.txt --verbose=1 /usr/bin/gfortran -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_tensor_unittest.dir/link.d -ffree-form -std=f2008ts -fimplicit-none -Werror=aliasing -Werror=ampersand -Werror=c-binding-type -Werror=intrinsic-shadow -Werror=intrinsics-std -Werror=line-truncation -Werror=tabs -Werror=target-lifetime -Werror=underflow -Werror=unused-but-set-parameter -Werror=unused-but-set-variable -Werror=unused-variable -Werror=unused-dummy-argument -Werror=conversion -Werror=zerotrip -Werror=uninitialized -Wno-maybe-uninitialized -Werror=unused-parameter -fallow-argument-mismatch CMakeFiles/dbcsr_tensor_unittest.dir/dbcsr_tensor_unittest.F.o -o dbcsr_tensor_unittest -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib libdbcsr_unittest_common.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 95%] Built target dbcsr_tensor_unittest /usr/bin/cmake -E cmake_copy_f90_mod src/dbcsr_tensor_api_c.mod src/CMakeFiles/dbcsr_c.dir/dbcsr_tensor_api_c.mod.stamp GNU -[ 95%] Linking Fortran static library libdbcsr_c.a +[ 95%] Built target dbcsr_tensor_unittest /usr/bin/cmake -E touch src/CMakeFiles/dbcsr_c.dir/tensors/dbcsr_tensor_api_c.F.o.provides.build +[ 95%] Linking Fortran static library libdbcsr_c.a cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/cmake -P CMakeFiles/dbcsr_c.dir/cmake_clean_target.cmake cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_c.dir/link.txt --verbose=1 /usr/bin/ar qc libdbcsr_c.a CMakeFiles/dbcsr_c.dir/dbcsr_api_c.F.o CMakeFiles/dbcsr_c.dir/tensors/dbcsr_tensor_api_c.F.o @@ -1604,25 +1640,25 @@ make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/DependInfo.cmake "--color=" make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +make -f tests/CMakeFiles/dbcsr_test.dir/build.make tests/CMakeFiles/dbcsr_test.dir/build make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_tensor_test.dir/build.make tests/CMakeFiles/dbcsr_tensor_test.dir/build -make -f examples/CMakeFiles/dbcsr_example_3_cpp.dir/build.make examples/CMakeFiles/dbcsr_example_3_cpp.dir/build make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_test.dir/build.make tests/CMakeFiles/dbcsr_test.dir/build make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +make -f tests/CMakeFiles/dbcsr_tensor_test.dir/build.make tests/CMakeFiles/dbcsr_tensor_test.dir/build make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +make -f examples/CMakeFiles/dbcsr_example_3_cpp.dir/build.make examples/CMakeFiles/dbcsr_example_3_cpp.dir/build make -f examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/build.make examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/build make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 95%] Building CXX object examples/CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o -[ 95%] Building CXX object tests/CMakeFiles/dbcsr_tensor_test.dir/dbcsr_tensor_test.cpp.o [ 95%] Building CXX object tests/CMakeFiles/dbcsr_test.dir/dbcsr_test.cpp.o -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/c++ -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -isystem /usr/lib/i386-linux-gnu/mpich/include -g -O2 -ffile-prefix-map=/build/reproducible-path/dbcsr-2.6.0=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -std=gnu++14 -MD -MT examples/CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o -MF CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o.d -o CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_example_3.cpp -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/c++ -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -isystem /usr/lib/i386-linux-gnu/mpich/include -g -O2 -ffile-prefix-map=/build/reproducible-path/dbcsr-2.6.0=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -std=gnu++11 -MD -MT tests/CMakeFiles/dbcsr_tensor_test.dir/dbcsr_tensor_test.cpp.o -MF CMakeFiles/dbcsr_tensor_test.dir/dbcsr_tensor_test.cpp.o.d -o CMakeFiles/dbcsr_tensor_test.dir/dbcsr_tensor_test.cpp.o -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_tensor_test.cpp cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/c++ -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -isystem /usr/lib/i386-linux-gnu/mpich/include -g -O2 -ffile-prefix-map=/build/reproducible-path/dbcsr-2.6.0=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -std=gnu++11 -MD -MT tests/CMakeFiles/dbcsr_test.dir/dbcsr_test.cpp.o -MF CMakeFiles/dbcsr_test.dir/dbcsr_test.cpp.o.d -o CMakeFiles/dbcsr_test.dir/dbcsr_test.cpp.o -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_test.cpp +[ 95%] Building CXX object examples/CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/c++ -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -isystem /usr/lib/i386-linux-gnu/mpich/include -g -O2 -ffile-prefix-map=/build/reproducible-path/dbcsr-2.6.0=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -std=gnu++14 -MD -MT examples/CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o -MF CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o.d -o CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_example_3.cpp [ 97%] Building CXX object examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/dbcsr_tensor_example_2.cpp.o +[ 97%] Building CXX object tests/CMakeFiles/dbcsr_tensor_test.dir/dbcsr_tensor_test.cpp.o cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/c++ -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -isystem /usr/lib/i386-linux-gnu/mpich/include -g -O2 -ffile-prefix-map=/build/reproducible-path/dbcsr-2.6.0=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -std=gnu++14 -MD -MT examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/dbcsr_tensor_example_2.cpp.o -MF CMakeFiles/dbcsr_tensor_example_2_cpp.dir/dbcsr_tensor_example_2.cpp.o.d -o CMakeFiles/dbcsr_tensor_example_2_cpp.dir/dbcsr_tensor_example_2.cpp.o -c /build/reproducible-path/dbcsr-2.6.0/examples/dbcsr_tensor_example_2.cpp +cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests && /usr/bin/c++ -I/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src -I/build/reproducible-path/dbcsr-2.6.0/src -isystem /usr/lib/i386-linux-gnu/mpich/include -g -O2 -ffile-prefix-map=/build/reproducible-path/dbcsr-2.6.0=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -std=gnu++11 -MD -MT tests/CMakeFiles/dbcsr_tensor_test.dir/dbcsr_tensor_test.cpp.o -MF CMakeFiles/dbcsr_tensor_test.dir/dbcsr_tensor_test.cpp.o.d -o CMakeFiles/dbcsr_tensor_test.dir/dbcsr_tensor_test.cpp.o -c /build/reproducible-path/dbcsr-2.6.0/tests/dbcsr_tensor_test.cpp [ 97%] Linking CXX executable dbcsr_example_3_cpp cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples && /usr/bin/cmake -E cmake_link_script CMakeFiles/dbcsr_example_3_cpp.dir/link.txt --verbose=1 /usr/bin/c++ -g -O2 -ffile-prefix-map=/build/reproducible-path/dbcsr-2.6.0=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -Wl,-z,relro -Wl,--dependency-file,CMakeFiles/dbcsr_example_3_cpp.dir/link.d CMakeFiles/dbcsr_example_3_cpp.dir/dbcsr_example_3.cpp.o -o dbcsr_example_3_cpp -Wl,-rpath,/usr/lib/i386-linux-gnu/mpich/lib ../src/libdbcsr_c.a ../src/libdbcsr.a /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/libblas.so /usr/lib/i386-linux-gnu/liblapack.so /usr/lib/i386-linux-gnu/mpich/lib/libmpichfort.so /usr/lib/gcc/i686-linux-gnu/14/libgomp.so /usr/lib/i386-linux-gnu/libpthread.a /usr/lib/i386-linux-gnu/mpich/lib/libmpichcxx.so /usr/lib/i386-linux-gnu/mpich/lib/libmpich.so -lgfortran -lquadmath @@ -1667,7 +1703,7 @@ test 1 Start 1: dbcsr_perf:inputs/test_H2O.perf -1: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_H2O.perf" +1: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_H2O.perf" 1: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 1: Environment variables: 1: OMP_NUM_THREADS=2 @@ -1686,12 +1722,12 @@ 1: DBCSR| Use Communication thread T (D) 1: DBCSR| Communication thread load 100 (D) 1: DBCSR| MPI: My process id 0 -1: DBCSR| MPI: Number of processes 12 +1: DBCSR| MPI: Number of processes 7 1: DBCSR| OMP: Current number of threads 2 1: DBCSR| OMP: Max number of threads 2 1: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 1: numthreads 2 -1: numnodes 12 +1: numnodes 7 1: matrix_sizes 2208 2208 2208 1: sparsities 0.20000000000000001 0.20000000000000001 0.20000000000000001 1: trans NN @@ -1708,7 +1744,7 @@ 1: ******************************************************************************** 1: -- PERF dbcsr_multiply (N, N, 3 , N, N, N) 1: matrix sizes A( 2208 x 2208), B( 2208 x 2208) and C( 2208 x 2208) -1: numnodes (nprows X npcols) = 12( 4 X 3) +1: numnodes (nprows X npcols) = 7( 7 X 1) 1: nthreads = 2 1: checksum(A) = 0.129355614363956E+07 1: checksum(B) = 0.130255535956734E+07 @@ -1718,12 +1754,12 @@ 1: 1: 1: mean std minmin maxmax -1: time = 724.12E-03 20.15E-03 616.14E-03 1.49E+00 seconds -1: perf total = 19.34E+09 354.65E+06 9.22E+09 22.24E+09 FLOPS -1: perf per node = 1.61E+09 29.55E+06 768.02E+06 1.85E+09 FLOPS -1: perf per thread = 805.92E+06 14.78E+06 384.01E+06 926.48E+06 FLOPS -1: load imbalance = 0.67E+00 0.19E-01 0.57E+00 0.14E+01 -1: rel load imbal = 0.92E+00 0.36E-04 0.92E+00 0.92E+00 +1: time = 2.09E+00 112.53E-03 1.47E+00 4.53E+00 seconds +1: perf total = 7.22E+09 251.69E+06 3.03E+09 9.32E+09 FLOPS +1: perf per node = 1.03E+09 35.96E+06 433.12E+06 1.33E+09 FLOPS +1: perf per thread = 515.43E+06 17.98E+06 216.56E+06 665.85E+06 FLOPS +1: load imbalance = 0.18E+01 0.98E-01 0.13E+01 0.39E+01 +1: rel load imbal = 0.86E+00 0.10E-03 0.86E+00 0.86E+00 1: ******************************************************************************** 1: 1: ------------------------------------------------------------------------------- @@ -1735,35 +1771,35 @@ 1: flops 23 x 23 x 23 687272462200 100.0% 0.0% 0.0% 1: flops inhomo. stacks 0 0.0% 0.0% 0.0% 1: flops total 687.272462E+09 100.0% 0.0% 0.0% -1: flops max/rank 58.054840E+09 100.0% 0.0% 0.0% +1: flops max/rank 101.245257E+09 100.0% 0.0% 0.0% 1: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% 1: matmuls total 28243300 100.0% 0.0% 0.0% -1: number of processed stacks 33750 100.0% 0.0% 0.0% -1: average stack size 836.8 0.0 0.0 +1: number of processed stacks 30700 100.0% 0.0% 0.0% +1: average stack size 920.0 0.0 0.0 1: marketing flops 1.076458E+12 1: ------------------------------------------------------------------------------- 1: # multiplications 50 -1: max memory usage/rank 136.876032E+06 -1: # max total images/rank 4 +1: max memory usage/rank 134.356992E+06 +1: # max total images/rank 7 1: # max 3D layers 1 -1: # MPI messages exchanged 10200 +1: # MPI messages exchanged 2100 1: MPI messages size (bytes): -1: total size 7.795557E+09 -1: min size 600.944000E+03 -1: max size 931.040000E+03 -1: average size 764.270312E+03 +1: total size 9.378529E+09 +1: min size 4.215072E+06 +1: max size 4.583256E+06 +1: average size 4.465966E+06 1: MPI breakdown and total messages size (bytes): 1: size <= 128 0 0 1: 128 < size <= 8192 0 0 1: 8192 < size <= 32768 0 0 1: 32768 < size <= 131072 0 0 -1: 131072 < size <= 4194304 10200 7795555600 -1: 4194304 < size <= 16777216 0 0 +1: 131072 < size <= 4194304 0 0 +1: 4194304 < size <= 16777216 2100 9378535200 1: 16777216 < size 0 0 1: ------------------------------------------------------------------------------- 1: 1: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -1: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +1: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 1: 1: ------------------------------------------------------------------------------- 1: - - @@ -1772,10 +1808,10 @@ 1: ------------------------------------------------------------------------------- 1: ROUTINE CALLS AVE VOLUME [Bytes] 1: MP_Bcast 2 12. -1: MP_Allreduce 328 38. -1: MP_Alltoall 121 259498. -1: MP_ISend 2100 351247. -1: MP_IRecv 2100 348820. +1: MP_Allreduce 328 26. +1: MP_Alltoall 121 422568. +1: MP_ISend 800 1677459. +1: MP_IRecv 800 1700270. 1: ------------------------------------------------------------------------------- 1: 1: ------------------------------------------------------------------------------- @@ -1785,115 +1821,114 @@ 1: ------------------------------------------------------------------------------- 1: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 1: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -1: dbcsr_performance_driver 1 1.0 0.000 0.000 36.681 36.683 0 -1: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 36.681 36.683 0 -1: perf_multiply 1 3.0 0.001 0.001 36.625 36.640 0 -1: dbcsr_multiply_generic 50 4.0 0.015 0.115 36.206 36.224 1 -1: multiply_cannon 50 5.0 0.071 0.149 30.765 31.339 7 -1: multiply_cannon_loop 50 6.0 0.140 0.174 30.115 30.646 9 -1: multiply_cannon_multrec 600 7.0 27.117 28.040 27.119 28.042 2 -1: mp_sum_l 385 4.2 3.424 4.522 3.424 4.522 0 -1: dbcsr_multiply_generic_mpsum_f 50 5.0 0.000 0.000 3.421 4.519 6 -1: mp_waitall_1 2200 8.3 3.198 4.123 3.198 4.123 11 -1: multiply_cannon_metrocomm1 600 7.0 0.002 0.002 1.954 2.853 8 -1: make_m2s 100 5.0 0.003 0.004 1.648 1.694 3 -1: make_images 100 6.0 0.127 0.159 1.639 1.686 11 -1: multiply_cannon_metrocomm3 600 7.0 0.001 0.001 0.887 1.227 7 -1: make_images_sizes 100 7.0 0.000 0.000 0.536 0.688 3 -1: mp_alltoall_i44 100 8.0 0.536 0.687 0.536 0.687 0 -1: make_images_data 100 7.0 0.003 0.003 0.453 0.529 3 -1: hybrid_alltoall_any 100 8.0 0.088 0.170 0.423 0.490 6 -1: dbcsr_special_finalize 350 7.0 0.004 0.011 0.272 0.323 11 -1: dbcsr_merge_single_wm 350 8.0 0.092 0.130 0.266 0.311 11 -1: buffer_matrices_ensure_size 100 6.0 0.219 0.283 0.219 0.283 10 -1: mp_allgather_i34 50 6.0 0.236 0.274 0.236 0.274 5 -1: dbcsr_finalize 57 4.9 0.001 0.002 0.086 0.248 0 -1: mp_sync 50 4.0 0.203 0.228 0.203 0.228 5 -1: dbcsr_merge_all 53 5.9 0.012 0.035 0.065 0.228 0 -1: dbcsr_copy 150 4.7 0.115 0.131 0.204 0.227 1 -1: make_images_pack 100 7.0 0.192 0.202 0.193 0.203 4 -1: dbcsr_data_copy_aa2 53 6.9 0.041 0.203 0.041 0.203 11 -1: dbcsr_create_new 857 6.7 0.106 0.142 0.131 0.182 10 -1: dbcsr_sort_data 350 9.0 0.166 0.173 0.166 0.173 11 -1: dbcsr_data_release 2740 7.1 0.152 0.167 0.152 0.167 3 -1: dbcsr_add_wm_from_matrix 50 5.0 0.020 0.052 0.121 0.138 0 -1: dbcsr_fill_wm_from_matrix 50 6.0 0.100 0.110 0.100 0.110 10 -1: dbcsr_destroy 807 5.4 0.002 0.002 0.085 0.097 11 -1: setup_rec_index_2d 100 6.0 0.044 0.094 0.044 0.094 2 -1: setup_buffer_matrices 100 6.0 0.002 0.002 0.038 0.083 5 -1: dbcsr_redistribute 3 4.0 0.024 0.035 0.060 0.071 3 -1: dbcsr_make_random_matrix 3 3.0 0.039 0.051 0.054 0.070 0 -1: dbcsr_checksum 5 4.0 0.017 0.027 0.042 0.047 3 -1: dbcsr_make_index_exist 857 7.7 0.021 0.041 0.021 0.041 1 -1: mp_alltoall_i22 3 5.0 0.024 0.041 0.024 0.041 6 -1: mp_sum_d 76 1.3 0.025 0.034 0.025 0.034 9 -1: dbcsr_make_untransposed_blocks 100 5.0 0.016 0.028 0.017 0.029 9 -1: dbcsr_work_destroy_all 406 7.7 0.001 0.002 0.021 0.022 10 -1: dbcsr_mm_multrec_init 50 6.0 0.000 0.000 0.010 0.015 1 -1: dbcsr_mm_csr_init 50 7.0 0.006 0.012 0.010 0.015 10 -1: mp_alltoall_d11v 9 5.0 0.008 0.011 0.008 0.011 3 -1: dbcsr_sort_indices 406 8.7 0.010 0.010 0.010 0.010 1 -1: multiply_cannon_metrocomm2 450 7.0 0.003 0.003 0.009 0.010 2 -1: dbcsr_data_new 1831 7.4 0.009 0.009 0.009 0.009 0 -1: dbcsr_make_index_list 350 6.0 0.005 0.009 0.005 0.009 9 -1: tree_to_linear_d 3 6.0 0.007 0.008 0.007 0.008 3 -1: multiply_cannon_metrocomm4 400 7.0 0.002 0.002 0.006 0.007 3 -1: merge_index 53 6.9 0.002 0.007 0.002 0.007 0 -1: mp_irecv_dv 1050 8.2 0.005 0.006 0.005 0.006 4 -1: dbcsr_init_lib_low 1 1.0 0.002 0.005 0.002 0.005 7 -1: mp_max_l 90 1.0 0.002 0.004 0.002 0.004 7 -1: fill_hash_tables 50 8.0 0.003 0.004 0.003 0.004 9 -1: dbcsr_work_create 406 6.8 0.001 0.001 0.003 0.003 0 -1: mp_isend_dv 1050 8.2 0.003 0.003 0.003 0.003 2 -1: mp_isend_iv 1150 8.0 0.003 0.003 0.003 0.003 1 -1: multiply_cannon_multrec_finali 50 8.0 0.000 0.000 0.003 0.003 2 -1: dbcsr_mm_multrec_finalize 50 9.0 0.002 0.003 0.002 0.003 3 -1: mp_cart_create 1 5.0 0.001 0.002 0.001 0.002 8 -1: dbcsr_iterator_start 356 7.0 0.001 0.001 0.002 0.002 4 -1: mp_irecv_iv 1150 8.0 0.001 0.002 0.001 0.002 3 -1: dbcsr_iterator_stop 356 7.0 0.001 0.001 0.001 0.001 8 -1: mp_maxloc_dv 203 1.0 0.001 0.001 0.001 0.001 8 -1: dbcsr_iterator_seek 356 8.0 0.001 0.001 0.001 0.001 6 -1: dbcsr_make_dbcsr_index 406 8.7 0.001 0.001 0.001 0.001 3 -1: dbcsr_make_index_local_row 350 6.0 0.001 0.001 0.001 0.001 0 -1: mp_bcast_av 99 1.0 0.000 0.000 0.001 0.001 6 -1: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 3 -1: mp_sum_b 100 5.0 0.001 0.001 0.001 0.001 2 -1: mp_max_i 93 1.0 0.000 0.000 0.000 0.000 8 -1: dbcsr_distribution_new 106 4.9 0.000 0.000 0.000 0.000 11 -1: mp_bcast_i 100 2.0 0.000 0.000 0.000 0.000 6 -1: quick_finalize 3 6.0 0.000 0.000 0.000 0.000 4 -1: dbcsr_switch_data_area 103 6.0 0.000 0.000 0.000 0.000 2 -1: dbcsr_mm_sched_init 50 8.0 0.000 0.000 0.000 0.000 6 -1: dbcsr_get_data_size_used 56 5.9 0.000 0.000 0.000 0.000 8 -1: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 -1: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 9 -1: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 5 -1: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 0 -1: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 7 -1: dbcsr_mm_sched_finalize 50 10.0 0.000 0.000 0.000 0.000 2 -1: dbcsr_get_local_cols 50 5.0 0.000 0.000 0.000 0.000 4 -1: dbcsr_get_local_rows 50 5.0 0.000 0.000 0.000 0.000 0 -1: dbcsr_get_global_col_map 50 5.0 0.000 0.000 0.000 0.000 10 -1: dbcsr_mm_hostdrv_init 50 9.0 0.000 0.000 0.000 0.000 4 +1: dbcsr_performance_driver 1 1.0 0.000 0.000 106.308 106.340 0 +1: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 106.308 106.339 0 +1: perf_multiply 1 3.0 0.001 0.002 106.141 106.174 0 +1: dbcsr_multiply_generic 50 4.0 0.055 0.094 104.314 104.503 0 +1: multiply_cannon 50 5.0 0.223 0.290 90.599 92.298 1 +1: multiply_cannon_loop 50 6.0 0.560 0.743 87.817 89.782 0 +1: multiply_cannon_multrec 350 7.0 73.445 75.893 73.452 75.898 5 +1: multiply_cannon_metrocomm1 350 7.0 0.010 0.015 13.786 16.531 2 +1: mp_waitall_1 2400 8.2 13.779 16.526 13.779 16.526 0 +1: mp_sum_l 385 4.2 6.004 7.455 6.004 7.455 1 +1: make_m2s 100 5.0 0.008 0.019 6.570 6.636 4 +1: make_images 100 6.0 0.755 0.878 6.464 6.530 5 +1: dbcsr_multiply_generic_mpsum_f 50 5.0 0.000 0.000 4.599 6.072 0 +1: make_images_sizes 100 7.0 0.001 0.001 1.855 2.064 0 +1: mp_alltoall_i44 100 8.0 1.855 2.063 1.855 2.063 0 +1: make_images_data 100 7.0 0.008 0.013 1.772 1.850 3 +1: hybrid_alltoall_any 100 8.0 1.756 1.838 1.758 1.839 1 +1: mp_allgather_i34 50 6.0 1.107 1.244 1.107 1.244 2 +1: buffer_matrices_ensure_size 100 6.0 0.946 1.086 0.946 1.086 0 +1: dbcsr_create_new 957 6.8 0.570 0.668 0.824 1.072 3 +1: dbcsr_special_finalize 400 7.0 0.097 0.117 0.934 1.015 6 +1: dbcsr_copy 150 4.7 0.507 0.599 0.914 1.011 3 +1: mp_sum_d 76 1.3 0.830 0.916 0.830 0.916 6 +1: mp_sync 50 4.0 0.784 0.885 0.784 0.885 1 +1: mp_maxloc_dv 201 1.0 0.741 0.871 0.741 0.871 2 +1: dbcsr_merge_single_wm 350 8.0 0.377 0.468 0.763 0.863 2 +1: make_images_pack 100 7.0 0.767 0.817 0.771 0.820 4 +1: dbcsr_add_wm_from_matrix 50 5.0 0.210 0.314 0.591 0.669 4 +1: dbcsr_finalize 57 4.9 0.017 0.034 0.457 0.587 6 +1: mp_max_l 89 1.0 0.464 0.543 0.464 0.543 6 +1: dbcsr_merge_all 53 5.9 0.175 0.280 0.370 0.497 6 +1: mp_max_i 92 1.0 0.391 0.472 0.391 0.472 0 +1: dbcsr_sort_data 350 9.0 0.375 0.453 0.375 0.453 4 +1: dbcsr_fill_wm_from_matrix 50 6.0 0.374 0.434 0.376 0.443 0 +1: setup_rec_index_2d 100 6.0 0.239 0.417 0.239 0.417 3 +1: dbcsr_make_index_exist 957 7.8 0.245 0.398 0.245 0.398 3 +1: dbcsr_data_release 2990 7.1 0.373 0.391 0.373 0.391 3 +1: dbcsr_checksum 5 4.0 0.247 0.315 0.367 0.379 3 +1: setup_buffer_matrices 100 6.0 0.005 0.012 0.193 0.348 2 +1: mp_sum_b 100 5.0 0.248 0.284 0.248 0.284 4 +1: dbcsr_redistribute 3 4.0 0.121 0.140 0.211 0.229 6 +1: dbcsr_destroy 907 5.4 0.005 0.006 0.169 0.188 0 +1: dbcsr_make_random_matrix 3 3.0 0.104 0.112 0.161 0.172 1 +1: mp_bcast_av 98 1.0 0.001 0.001 0.077 0.161 5 +1: mp_bcast_i 99 2.0 0.076 0.160 0.076 0.160 2 +1: dbcsr_data_copy_aa2 53 6.9 0.145 0.156 0.145 0.156 3 +1: dbcsr_make_index_list 400 6.0 0.097 0.147 0.097 0.147 0 +1: dbcsr_make_untransposed_blocks 100 5.0 0.072 0.120 0.074 0.122 6 +1: dbcsr_work_destroy_all 456 7.7 0.008 0.015 0.076 0.100 2 +1: quick_finalize 53 7.9 0.060 0.091 0.068 0.098 2 +1: mp_alltoall_d11v 9 5.0 0.050 0.061 0.050 0.061 1 +1: dbcsr_data_new 1981 7.4 0.030 0.057 0.030 0.057 6 +1: mp_sum_lv 2 1.0 0.039 0.055 0.039 0.055 6 +1: mp_alltoall_i22 3 5.0 0.031 0.045 0.031 0.045 2 +1: dbcsr_mm_multrec_init 50 6.0 0.000 0.000 0.024 0.038 5 +1: dbcsr_mm_csr_init 50 7.0 0.015 0.023 0.023 0.038 2 +1: mp_sum_root_rm 2 4.0 0.020 0.036 0.020 0.036 0 +1: merge_index 53 6.9 0.019 0.035 0.019 0.035 6 +1: tree_to_linear_d 3 6.0 0.024 0.029 0.024 0.029 3 +1: mp_sum_r 1 1.0 0.015 0.028 0.015 0.028 0 +1: mp_bcast_iv 2 1.0 0.006 0.028 0.006 0.028 4 +1: dbcsr_sort_indices 456 8.7 0.021 0.027 0.021 0.027 1 +1: mp_sum_i 1 1.0 0.011 0.024 0.011 0.024 2 +1: multiply_cannon_metrocomm2 300 7.0 0.005 0.006 0.018 0.024 0 +1: mp_max_rv 1 1.0 0.013 0.020 0.013 0.020 6 +1: mp_max_r 1 1.0 0.012 0.020 0.012 0.020 4 +1: mp_min_rv 1 1.0 0.012 0.016 0.012 0.016 2 +1: mp_sum_lm3 1 1.0 0.016 0.016 0.016 0.016 6 +1: mp_max_d 1 1.0 0.011 0.016 0.011 0.016 4 +1: fill_hash_tables 50 8.0 0.008 0.014 0.008 0.014 2 +1: multiply_cannon_multrec_finali 50 8.0 0.000 0.000 0.007 0.014 1 +1: dbcsr_make_dbcsr_index 456 8.7 0.003 0.014 0.003 0.014 1 +1: dbcsr_mm_multrec_finalize 50 9.0 0.007 0.013 0.007 0.013 2 +1: dbcsr_iterator_start 356 7.0 0.004 0.011 0.005 0.012 3 +1: mp_sum_rv 1 1.0 0.010 0.012 0.010 0.012 4 +1: dbcsr_init_lib_low 1 1.0 0.005 0.012 0.005 0.012 4 +1: dbcsr_iterator_stop 356 7.0 0.004 0.011 0.005 0.012 3 +1: mp_irecv_dv 300 8.0 0.004 0.011 0.004 0.011 5 +1: dbcsr_work_create 456 6.9 0.003 0.003 0.008 0.008 1 +1: mp_isend_dv 300 8.0 0.004 0.006 0.004 0.006 6 +1: mp_isend_iv 500 8.0 0.005 0.006 0.005 0.006 0 +1: mp_irecv_iv 500 8.0 0.004 0.005 0.004 0.005 2 +1: dbcsr_make_index_local_row 400 6.0 0.002 0.005 0.002 0.005 0 +1: mp_cart_create 1 5.0 0.002 0.004 0.002 0.004 4 +1: dbcsr_iterator_seek 356 8.0 0.002 0.002 0.002 0.002 4 +1: mp_cart_sub 2 5.0 0.002 0.002 0.002 0.002 4 +1: dbcsr_switch_data_area 153 7.0 0.001 0.001 0.001 0.001 0 +1: dbcsr_distribution_new 106 4.9 0.001 0.001 0.001 0.001 6 +1: multiply_cannon_metrocomm3 350 7.0 0.000 0.000 0.000 0.000 1 +1: dbcsr_mm_sched_init 50 8.0 0.000 0.000 0.000 0.000 3 +1: dbcsr_get_data_size_used 56 5.9 0.000 0.000 0.000 0.000 6 +1: dbcsr_mm_sched_finalize 50 10.0 0.000 0.000 0.000 0.000 3 1: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 0 -1: dbcsr_get_global_row_map 50 5.0 0.000 0.000 0.000 0.000 7 -1: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 1 -1: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 4 -1: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 10 -1: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 4 -1: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 3 -1: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 1 -1: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 8 -1: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 10 -1: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 8 +1: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 1 +1: dbcsr_get_local_rows 50 5.0 0.000 0.000 0.000 0.000 2 +1: dbcsr_get_global_row_map 50 5.0 0.000 0.000 0.000 0.000 2 +1: dbcsr_get_global_col_map 50 5.0 0.000 0.000 0.000 0.000 2 +1: dbcsr_get_local_cols 50 5.0 0.000 0.000 0.000 0.000 5 +1: dbcsr_mm_hostdrv_init 50 9.0 0.000 0.000 0.000 0.000 5 +1: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 4 +1: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 0 1: ------------------------------------------------------------------------------- 1: - 1/19 Test #1: dbcsr_perf:inputs/test_H2O.perf ....................... Passed 36.74 sec + 1/19 Test #1: dbcsr_perf:inputs/test_H2O.perf ....................... Passed 109.87 sec test 2 Start 2: dbcsr_perf:inputs/test_rect1_dense.perf -2: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_rect1_dense.perf" +2: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_rect1_dense.perf" 2: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 2: Environment variables: 2: OMP_NUM_THREADS=2 @@ -1912,12 +1947,12 @@ 2: DBCSR| Use Communication thread T (D) 2: DBCSR| Communication thread load 100 (D) 2: DBCSR| MPI: My process id 0 -2: DBCSR| MPI: Number of processes 12 +2: DBCSR| MPI: Number of processes 7 2: DBCSR| OMP: Current number of threads 2 2: DBCSR| OMP: Max number of threads 2 2: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 2: numthreads 2 -2: numnodes 12 +2: numnodes 7 2: matrix_sizes 1000 100 100 2: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 2: trans NN @@ -1934,7 +1969,7 @@ 2: ******************************************************************************** 2: -- PERF dbcsr_multiply (N, N, 3 , N, N, N) 2: matrix sizes A( 1000 x 100), B( 100 x 100) and C( 1000 x 100) -2: numnodes (nprows X npcols) = 12( 12 X 1) +2: numnodes (nprows X npcols) = 7( 7 X 1) 2: nthreads = 2 2: checksum(A) = 0.333563309139543E+05 2: checksum(B) = 0.342949174893408E+04 @@ -1944,12 +1979,12 @@ 2: 2: 2: mean std minmin maxmax -2: time = 43.66E-03 5.04E-03 25.18E-03 74.11E-03 seconds -2: perf total = 474.58E+06 42.03E+06 269.88E+06 627.46E+06 FLOPS -2: perf per node = 39.55E+06 3.50E+06 22.49E+06 52.29E+06 FLOPS -2: perf per thread = 19.77E+06 1.75E+06 11.24E+06 26.14E+06 FLOPS -2: load imbalance = 0.43E-01 0.47E-02 0.30E-01 0.68E-01 -2: rel load imbal = 0.92E+00 0.10E-02 0.92E+00 0.93E+00 +2: time = 423.03E-03 32.11E-03 220.87E-03 664.22E-03 seconds +2: perf total = 47.12E+06 4.06E+06 30.11E+06 77.96E+06 FLOPS +2: perf per node = 6.73E+06 580.47E+03 4.30E+06 11.14E+06 FLOPS +2: perf per thread = 3.37E+06 290.24E+03 2.15E+06 5.57E+06 FLOPS +2: load imbalance = 0.39E+00 0.32E-01 0.22E+00 0.58E+00 +2: rel load imbal = 0.87E+00 0.12E-02 0.86E+00 0.87E+00 2: ******************************************************************************** 2: 2: ------------------------------------------------------------------------------- @@ -1958,35 +1993,33 @@ 2: - - 2: ------------------------------------------------------------------------------- 2: COUNTER TOTAL BLAS SMM ACC -2: flops 35 x 100 x 5 2800000 100.0% 0.0% 0.0% -2: flops 35 x 100 x 10 11200000 100.0% 0.0% 0.0% -2: flops 45 x 100 x 5 18000000 100.0% 0.0% 0.0% -2: flops 40 x 100 x 5 19200000 100.0% 0.0% 0.0% -2: flops 45 x 100 x 10 72000000 100.0% 0.0% 0.0% -2: flops 40 x 100 x 10 76800000 100.0% 0.0% 0.0% +2: flops 75 x 100 x 10 6000000 100.0% 0.0% 0.0% +2: flops 70 x 100 x 10 14000000 100.0% 0.0% 0.0% +2: flops 75 x 100 x 15 54000000 100.0% 0.0% 0.0% +2: flops 70 x 100 x 15 126000000 100.0% 0.0% 0.0% 2: flops inhomo. stacks 0 0.0% 0.0% 0.0% 2: flops total 200.000000E+06 100.0% 0.0% 0.0% -2: flops max/rank 17.000000E+06 100.0% 0.0% 0.0% +2: flops max/rank 29.000000E+06 100.0% 0.0% 0.0% 2: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% -2: matmuls total 2880 100.0% 0.0% 0.0% -2: number of processed stacks 2880 100.0% 0.0% 0.0% +2: matmuls total 980 100.0% 0.0% 0.0% +2: number of processed stacks 980 100.0% 0.0% 0.0% 2: average stack size 1.0 0.0 0.0 -2: marketing flops 200.000016E+06 +2: marketing flops 199.999968E+06 2: ------------------------------------------------------------------------------- 2: # multiplications 10 -2: max memory usage/rank 99.299328E+06 -2: # max total images/rank 12 +2: max memory usage/rank 73.629696E+06 +2: # max total images/rank 7 2: # max 3D layers 1 -2: # MPI messages exchanged 1320 +2: # MPI messages exchanged 420 2: MPI messages size (bytes): -2: total size 8.800000E+06 -2: min size 4.000000E+03 -2: max size 8.000000E+03 -2: average size 6.666667E+03 +2: total size 4.800000E+06 +2: min size 8.000000E+03 +2: max size 12.000000E+03 +2: average size 11.428571E+03 2: MPI breakdown and total messages size (bytes): 2: size <= 128 0 0 -2: 128 < size <= 8192 1320 8800000 -2: 8192 < size <= 32768 0 0 +2: 128 < size <= 8192 60 480000 +2: 8192 < size <= 32768 360 4320000 2: 32768 < size <= 131072 0 0 2: 131072 < size <= 4194304 0 0 2: 4194304 < size <= 16777216 0 0 @@ -1994,7 +2027,7 @@ 2: ------------------------------------------------------------------------------- 2: 2: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -2: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +2: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 2: 2: ------------------------------------------------------------------------------- 2: - - @@ -2002,11 +2035,11 @@ 2: - - 2: ------------------------------------------------------------------------------- 2: ROUTINE CALLS AVE VOLUME [Bytes] -2: MP_Bcast 7 12. -2: MP_Allreduce 98 32. -2: MP_Alltoall 41 14576. -2: MP_ISend 260 3533. -2: MP_IRecv 260 3379. +2: MP_Bcast 5 12. +2: MP_Allreduce 94 24. +2: MP_Alltoall 41 25033. +2: MP_ISend 160 5900. +2: MP_IRecv 160 5900. 2: ------------------------------------------------------------------------------- 2: 2: ------------------------------------------------------------------------------- @@ -2016,119 +2049,119 @@ 2: ------------------------------------------------------------------------------- 2: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 2: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -2: dbcsr_performance_driver 1 1.0 0.000 0.000 0.509 0.512 0 -2: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 0.509 0.511 0 -2: perf_multiply 1 3.0 0.000 0.000 0.504 0.509 0 -2: dbcsr_multiply_generic 10 4.0 0.001 0.001 0.437 0.450 2 -2: multiply_cannon 10 5.0 0.016 0.040 0.210 0.219 11 -2: make_m2s 20 5.0 0.001 0.001 0.162 0.171 1 -2: make_images 20 6.0 0.029 0.043 0.150 0.160 10 -2: multiply_cannon_loop 10 6.0 0.002 0.004 0.137 0.153 11 -2: make_images_sizes 20 7.0 0.000 0.000 0.113 0.129 11 -2: mp_alltoall_i44 20 8.0 0.113 0.129 0.113 0.129 4 -2: multiply_cannon_metrocomm1 120 7.0 0.001 0.001 0.103 0.124 2 -2: mp_waitall_1 680 8.2 0.103 0.123 0.103 0.123 9 -2: mp_allgather_i34 10 6.0 0.051 0.059 0.051 0.059 8 -2: multiply_cannon_multrec 120 7.0 0.029 0.043 0.030 0.044 5 -2: mp_sum_l 145 2.7 0.032 0.040 0.032 0.040 8 -2: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.031 0.039 5 -2: dbcsr_make_dense 10 5.0 0.000 0.000 0.006 0.032 1 -2: mp_sync 10 4.0 0.027 0.031 0.027 0.031 6 -2: dbcsr_create_new 447 6.8 0.015 0.024 0.019 0.030 11 -2: dbcsr_make_dense_low 140 6.9 0.001 0.001 0.010 0.028 1 -2: dbcsr_make_undense 10 5.0 0.002 0.002 0.013 0.026 2 -2: make_dense_data 140 7.9 0.005 0.009 0.008 0.026 8 -2: dbcsr_redistribute 3 4.0 0.006 0.010 0.019 0.023 1 -2: dbcsr_checksum 5 4.0 0.005 0.010 0.020 0.022 3 -2: mp_sum_d 76 1.3 0.015 0.020 0.015 0.020 8 -2: mp_alltoall_i22 3 5.0 0.012 0.019 0.012 0.019 2 -2: dbcsr_make_dists_dense 10 5.0 0.010 0.018 0.010 0.018 0 -2: buffer_matrices_ensure_size 20 6.0 0.002 0.014 0.002 0.014 2 -2: dbcsr_iterator_start 226 8.1 0.002 0.011 0.002 0.012 8 -2: dbcsr_make_images_dense 20 6.0 0.001 0.001 0.009 0.010 10 -2: dbcsr_init_lib_low 1 1.0 0.003 0.009 0.003 0.009 1 -2: make_images_data 20 7.0 0.000 0.000 0.003 0.009 11 -2: hybrid_alltoall_any 20 8.0 0.002 0.008 0.002 0.009 1 -2: dbcsr_make_index_exist 447 7.8 0.003 0.007 0.003 0.007 8 -2: dbcsr_make_random_matrix 3 3.0 0.003 0.003 0.004 0.007 3 -2: mp_max_l 94 1.0 0.005 0.006 0.005 0.006 7 -2: dbcsr_iterator_stop 226 8.1 0.001 0.006 0.001 0.006 8 -2: dbcsr_make_untransposed_blocks 20 5.0 0.001 0.005 0.001 0.005 8 -2: setup_buffer_matrices 20 6.0 0.000 0.000 0.002 0.005 4 -2: dbcsr_copy 10 4.0 0.001 0.004 0.001 0.004 9 -2: dbcsr_finalize 17 4.8 0.000 0.000 0.002 0.004 2 -2: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.004 2 -2: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.004 0.001 0.004 4 -2: dbcsr_merge_all 13 5.8 0.001 0.003 0.001 0.004 0 -2: dbcsr_special_finalize 130 7.0 0.000 0.000 0.002 0.002 11 -2: setup_rec_index_2d 20 6.0 0.001 0.002 0.001 0.002 4 -2: quick_finalize 133 8.0 0.001 0.001 0.002 0.002 3 -2: multiply_cannon_metrocomm2 110 7.0 0.001 0.001 0.001 0.002 2 -2: dbcsr_destroy 437 5.9 0.001 0.001 0.001 0.001 7 -2: make_images_pack 20 7.0 0.001 0.001 0.001 0.001 6 -2: dbcsr_make_index_list 130 6.0 0.001 0.001 0.001 0.001 5 -2: mp_maxloc_dv 211 1.0 0.001 0.001 0.001 0.001 9 -2: dbcsr_data_release 1830 8.0 0.001 0.001 0.001 0.001 10 -2: dbcsr_data_new 1021 7.8 0.001 0.001 0.001 0.001 6 -2: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 2 -2: mp_bcast_av 103 1.0 0.000 0.000 0.001 0.001 1 -2: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.001 0.001 0 -2: dbcsr_mm_csr_init 10 7.0 0.001 0.001 0.001 0.001 4 -2: dbcsr_sort_indices 146 8.8 0.001 0.001 0.001 0.001 8 -2: dbcsr_switch_data_area 283 8.3 0.000 0.000 0.001 0.001 1 -2: mp_isend_dv 110 8.0 0.000 0.001 0.000 0.001 1 -2: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.000 0.000 0.001 0 -2: mp_bcast_i 104 2.0 0.000 0.001 0.000 0.001 5 -2: dbcsr_work_create 146 6.8 0.000 0.000 0.000 0.001 3 -2: tree_to_linear_d 3 6.0 0.000 0.001 0.000 0.001 3 -2: mp_max_i 102 1.0 0.000 0.000 0.000 0.000 9 -2: dbcsr_fill_wm_from_matrix 10 6.0 0.000 0.000 0.000 0.000 3 -2: dbcsr_work_destroy_all 146 7.8 0.000 0.000 0.000 0.000 10 -2: dbcsr_iterator_seek 226 9.1 0.000 0.000 0.000 0.000 11 -2: dbcsr_index_prune_deleted 130 7.0 0.000 0.000 0.000 0.000 0 -2: mp_isend_iv 150 8.0 0.000 0.000 0.000 0.000 2 -2: dbcsr_data_copy_aa2 13 6.8 0.000 0.000 0.000 0.000 7 -2: dbcsr_make_dbcsr_index 146 8.8 0.000 0.000 0.000 0.000 8 -2: dbcsr_distribution_new 56 5.4 0.000 0.000 0.000 0.000 11 -2: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 5 -2: dbcsr_make_index_local_row 130 6.0 0.000 0.000 0.000 0.000 6 -2: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 10 -2: mp_irecv_iv 150 8.0 0.000 0.000 0.000 0.000 2 -2: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 5 -2: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 8 -2: mp_irecv_dv 110 8.0 0.000 0.000 0.000 0.000 11 -2: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 -2: merge_index 13 6.8 0.000 0.000 0.000 0.000 3 -2: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 9 -2: dbcsr_get_local_rows 20 5.5 0.000 0.000 0.000 0.000 10 -2: multiply_cannon_metrocomm3 120 7.0 0.000 0.000 0.000 0.000 11 -2: mp_sum_lv 7 1.0 0.000 0.000 0.000 0.000 9 -2: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 8 -2: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 4 -2: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 5 -2: mp_bcast_iv 7 1.0 0.000 0.000 0.000 0.000 6 -2: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 3 -2: dbcsr_get_local_cols 20 5.5 0.000 0.000 0.000 0.000 8 -2: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 9 +2: dbcsr_performance_driver 1 1.0 0.001 0.008 5.448 5.464 0 +2: dbcsr_perf_multiply_low 1 2.0 0.049 0.165 5.447 5.463 5 +2: perf_multiply 1 3.0 0.000 0.001 5.344 5.446 0 +2: dbcsr_multiply_generic 10 4.0 0.005 0.018 4.230 4.380 5 +2: multiply_cannon 10 5.0 0.137 0.178 1.631 1.688 6 +2: mp_sum_l 145 2.7 1.466 1.589 1.466 1.589 1 +2: multiply_cannon_loop 10 6.0 0.123 0.157 0.985 1.185 5 +2: make_m2s 20 5.0 0.001 0.001 0.876 0.941 6 +2: multiply_cannon_metrocomm1 70 7.0 0.001 0.001 0.665 0.901 2 +2: mp_waitall_1 480 8.2 0.665 0.900 0.665 0.900 2 +2: make_images 20 6.0 0.147 0.191 0.829 0.896 2 +2: make_images_sizes 20 7.0 0.000 0.000 0.634 0.709 6 +2: mp_alltoall_i44 20 8.0 0.634 0.709 0.634 0.709 4 +2: dbcsr_redistribute 3 4.0 0.082 0.141 0.549 0.667 1 +2: mp_maxloc_dv 211 1.0 0.553 0.630 0.553 0.630 2 +2: mp_sum_d 76 1.3 0.499 0.601 0.499 0.601 0 +2: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.451 0.585 0 +2: dbcsr_create_new 297 6.7 0.167 0.316 0.254 0.500 0 +2: mp_alltoall_i22 3 5.0 0.386 0.484 0.386 0.484 6 +2: mp_sync 10 4.0 0.412 0.475 0.412 0.475 2 +2: mp_max_l 94 1.0 0.316 0.406 0.316 0.406 3 +2: mp_allgather_i34 10 6.0 0.301 0.375 0.301 0.375 0 +2: mp_max_i 100 1.0 0.344 0.370 0.344 0.370 6 +2: dbcsr_make_random_matrix 3 3.0 0.009 0.013 0.054 0.264 1 +2: dbcsr_finalize 17 4.8 0.004 0.021 0.097 0.259 0 +2: mp_sum_b 20 5.0 0.222 0.254 0.222 0.254 0 +2: dbcsr_merge_all 13 5.8 0.080 0.212 0.091 0.237 0 +2: multiply_cannon_multrec 70 7.0 0.168 0.206 0.194 0.233 0 +2: dbcsr_make_undense 10 5.0 0.025 0.041 0.149 0.233 0 +2: dbcsr_make_dense 10 5.0 0.000 0.000 0.137 0.195 6 +2: dbcsr_make_index_exist 297 7.7 0.087 0.183 0.087 0.183 0 +2: setup_rec_index_2d 20 6.0 0.119 0.177 0.119 0.177 6 +2: dbcsr_checksum 5 4.0 0.027 0.050 0.137 0.166 1 +2: dbcsr_make_dense_low 90 6.9 0.003 0.010 0.066 0.134 5 +2: make_dense_data 90 7.9 0.029 0.060 0.062 0.131 0 +2: buffer_matrices_ensure_size 20 6.0 0.059 0.129 0.059 0.129 6 +2: dbcsr_make_dists_dense 10 5.0 0.099 0.115 0.099 0.115 1 +2: mp_bcast_av 103 1.0 0.001 0.001 0.064 0.111 5 +2: mp_bcast_i 104 2.0 0.063 0.110 0.063 0.110 5 +2: dbcsr_make_images_dense 20 6.0 0.004 0.009 0.034 0.103 1 +2: dbcsr_iterator_start 176 7.8 0.050 0.098 0.050 0.098 0 +2: mp_sum_lv 5 1.0 0.080 0.088 0.080 0.088 1 +2: setup_buffer_matrices 20 6.0 0.000 0.001 0.026 0.079 0 +2: mp_cart_sub 2 5.0 0.060 0.064 0.060 0.064 1 +2: dbcsr_init_lib_low 1 1.0 0.039 0.060 0.039 0.060 5 +2: make_images_data 20 7.0 0.001 0.001 0.034 0.051 6 +2: hybrid_alltoall_any 20 8.0 0.033 0.049 0.033 0.049 6 +2: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.026 0.038 4 +2: dbcsr_mm_multrec_finalize 10 9.0 0.026 0.038 0.026 0.038 5 +2: dbcsr_iterator_stop 176 7.8 0.011 0.033 0.012 0.033 0 +2: dbcsr_copy 10 4.0 0.007 0.029 0.007 0.029 6 +2: merge_index 13 6.8 0.009 0.024 0.009 0.024 6 +2: mp_bcast_iv 5 1.0 0.018 0.024 0.018 0.024 4 +2: mp_sum_r 1 1.0 0.014 0.024 0.014 0.024 3 +2: mp_max_r 1 1.0 0.013 0.024 0.013 0.024 0 +2: mp_cart_create 1 5.0 0.019 0.023 0.019 0.023 3 +2: dbcsr_special_finalize 80 7.0 0.001 0.001 0.006 0.019 5 +2: quick_finalize 83 7.9 0.005 0.017 0.007 0.019 6 +2: mp_sum_i 1 1.0 0.010 0.016 0.010 0.016 0 +2: mp_sum_rv 1 1.0 0.009 0.013 0.009 0.013 2 +2: mp_sum_root_rm 2 4.0 0.002 0.013 0.002 0.013 0 +2: mp_max_rv 1 1.0 0.009 0.012 0.009 0.012 6 +2: mp_max_d 1 1.0 0.005 0.012 0.005 0.012 4 +2: dbcsr_make_untransposed_blocks 20 5.0 0.002 0.009 0.003 0.010 4 +2: mp_sum_lm3 1 1.0 0.005 0.008 0.005 0.008 1 +2: mp_min_rv 1 1.0 0.008 0.008 0.008 0.008 5 +2: dbcsr_destroy 287 5.9 0.001 0.001 0.003 0.006 5 +2: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.004 0.006 1 +2: dbcsr_mm_csr_init 10 7.0 0.003 0.006 0.003 0.006 2 +2: dbcsr_data_release 1280 7.8 0.002 0.006 0.002 0.006 5 +2: dbcsr_make_index_list 80 6.0 0.002 0.005 0.002 0.005 4 +2: dbcsr_sort_indices 96 8.6 0.002 0.005 0.002 0.005 1 +2: tree_to_linear_d 3 6.0 0.001 0.005 0.001 0.005 6 +2: dbcsr_distribution_new 56 5.4 0.001 0.004 0.001 0.004 3 +2: multiply_cannon_metrocomm2 60 7.0 0.001 0.001 0.002 0.002 4 +2: make_images_pack 20 7.0 0.002 0.002 0.002 0.002 4 +2: dbcsr_data_new 721 7.6 0.002 0.002 0.002 0.002 4 +2: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.000 0.001 0.001 6 +2: mp_isend_dv 60 8.0 0.001 0.001 0.001 0.001 6 +2: dbcsr_switch_data_area 183 8.3 0.001 0.001 0.001 0.001 3 +2: dbcsr_work_create 96 6.7 0.001 0.001 0.001 0.001 5 +2: dbcsr_fill_wm_from_matrix 10 6.0 0.001 0.001 0.001 0.001 0 +2: dbcsr_work_destroy_all 96 7.6 0.000 0.000 0.001 0.001 4 +2: dbcsr_data_copy_aa2 13 6.8 0.001 0.001 0.001 0.001 4 +2: dbcsr_iterator_seek 176 8.8 0.000 0.001 0.000 0.001 1 +2: mp_isend_iv 100 8.0 0.000 0.000 0.000 0.000 1 +2: mp_irecv_iv 100 8.0 0.000 0.000 0.000 0.000 6 +2: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 6 +2: dbcsr_make_dbcsr_index 96 8.6 0.000 0.000 0.000 0.000 4 +2: dbcsr_index_prune_deleted 80 7.0 0.000 0.000 0.000 0.000 1 +2: mp_irecv_dv 60 8.0 0.000 0.000 0.000 0.000 2 +2: dbcsr_make_index_local_row 80 6.0 0.000 0.000 0.000 0.000 6 +2: dbcsr_get_local_rows 20 5.5 0.000 0.000 0.000 0.000 6 +2: multiply_cannon_metrocomm3 70 7.0 0.000 0.000 0.000 0.000 0 +2: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 0 +2: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 6 +2: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 0 +2: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 5 +2: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 3 +2: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 6 2: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 4 -2: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 10 -2: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 0 -2: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 5 -2: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 7 -2: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 10 -2: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 7 -2: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 9 -2: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 9 -2: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 10 -2: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 7 +2: dbcsr_get_local_cols 20 5.5 0.000 0.000 0.000 0.000 2 +2: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 5 +2: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 0 +2: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 4 2: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 2 2: ------------------------------------------------------------------------------- 2: - 2/19 Test #2: dbcsr_perf:inputs/test_rect1_dense.perf ............... Passed 0.58 sec + 2/19 Test #2: dbcsr_perf:inputs/test_rect1_dense.perf ............... Passed 8.37 sec test 3 Start 3: dbcsr_perf:inputs/test_rect1_sparse.perf -3: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_rect1_sparse.perf" +3: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_rect1_sparse.perf" 3: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 3: Environment variables: 3: OMP_NUM_THREADS=2 @@ -2147,12 +2180,12 @@ 3: DBCSR| Use Communication thread T (D) 3: DBCSR| Communication thread load 100 (D) 3: DBCSR| MPI: My process id 0 -3: DBCSR| MPI: Number of processes 12 +3: DBCSR| MPI: Number of processes 7 3: DBCSR| OMP: Current number of threads 2 3: DBCSR| OMP: Max number of threads 2 3: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 3: numthreads 2 -3: numnodes 12 +3: numnodes 7 3: matrix_sizes 5000 1000 1000 3: sparsities 0.90000000000000002 0.90000000000000002 0.90000000000000002 3: trans NN @@ -2169,7 +2202,7 @@ 3: ******************************************************************************** 3: -- PERF dbcsr_multiply (N, N, 3 , N, N, N) 3: matrix sizes A( 5000 x 1000), B( 1000 x 1000) and C( 5000 x 1000) -3: numnodes (nprows X npcols) = 12( 12 X 1) +3: numnodes (nprows X npcols) = 7( 7 X 1) 3: nthreads = 2 3: checksum(A) = 0.167223715953740E+06 3: checksum(B) = 0.336183330312199E+05 @@ -2179,12 +2212,12 @@ 3: 3: 3: mean std minmin maxmax -3: time = 80.66E-03 2.59E-03 64.38E-03 96.46E-03 seconds -3: perf total = 1.21E+09 40.84E+06 1.05E+09 1.50E+09 FLOPS -3: perf per node = 100.62E+06 3.40E+06 87.42E+06 125.15E+06 FLOPS -3: perf per thread = 50.31E+06 1.70E+06 43.71E+06 62.57E+06 FLOPS -3: load imbalance = 0.78E-01 0.25E-02 0.62E-01 0.89E-01 -3: rel load imbal = 0.92E+00 0.25E-03 0.92E+00 0.92E+00 +3: time = 1.21E+00 101.44E-03 748.50E-03 1.75E+00 seconds +3: perf total = 87.83E+06 7.14E+06 57.97E+06 129.08E+06 FLOPS +3: perf per node = 12.55E+06 1.02E+06 8.28E+06 18.44E+06 FLOPS +3: perf per thread = 6.27E+06 510.21E+03 4.14E+06 9.22E+06 FLOPS +3: load imbalance = 0.11E+01 0.88E-01 0.67E+00 0.15E+01 +3: rel load imbal = 0.86E+00 0.39E-03 0.86E+00 0.86E+00 3: ******************************************************************************** 3: 3: ------------------------------------------------------------------------------- @@ -2196,35 +2229,35 @@ 3: flops 5 x 5 x 5 1011962500 100.0% 0.0% 0.0% 3: flops inhomo. stacks 0 0.0% 0.0% 0.0% 3: flops total 1.011962E+09 100.0% 0.0% 0.0% -3: flops max/rank 86.315000E+06 100.0% 0.0% 0.0% +3: flops max/rank 148.020000E+06 100.0% 0.0% 0.0% 3: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% 3: matmuls total 4047850 100.0% 0.0% 0.0% -3: number of processed stacks 5720 100.0% 0.0% 0.0% -3: average stack size 707.7 0.0 0.0 -3: marketing flops 99.999998E+09 +3: number of processed stacks 4580 100.0% 0.0% 0.0% +3: average stack size 883.8 0.0 0.0 +3: marketing flops 99.999990E+09 3: ------------------------------------------------------------------------------- 3: # multiplications 10 -3: max memory usage/rank 111.865856E+06 -3: # max total images/rank 12 +3: max memory usage/rank 90.660864E+06 +3: # max total images/rank 7 3: # max 3D layers 1 -3: # MPI messages exchanged 1320 +3: # MPI messages exchanged 420 3: MPI messages size (bytes): -3: total size 88.946000E+06 -3: min size 57.200000E+03 -3: max size 76.200000E+03 -3: average size 67.383336E+03 +3: total size 48.516000E+06 +3: min size 112.200000E+03 +3: max size 121.000000E+03 +3: average size 115.514289E+03 3: MPI breakdown and total messages size (bytes): 3: size <= 128 0 0 3: 128 < size <= 8192 0 0 3: 8192 < size <= 32768 0 0 -3: 32768 < size <= 131072 1320 88946000 +3: 32768 < size <= 131072 420 48516000 3: 131072 < size <= 4194304 0 0 3: 4194304 < size <= 16777216 0 0 3: 16777216 < size 0 0 3: ------------------------------------------------------------------------------- 3: 3: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -3: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +3: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 3: 3: ------------------------------------------------------------------------------- 3: - - @@ -2233,10 +2266,10 @@ 3: ------------------------------------------------------------------------------- 3: ROUTINE CALLS AVE VOLUME [Bytes] 3: MP_Bcast 2 12. -3: MP_Allreduce 88 33. -3: MP_Alltoall 41 75779. -3: MP_ISend 260 33230. -3: MP_IRecv 260 33711. +3: MP_Allreduce 88 24. +3: MP_Alltoall 41 128465. +3: MP_ISend 160 54844. +3: MP_IRecv 160 54698. 3: ------------------------------------------------------------------------------- 3: 3: ------------------------------------------------------------------------------- @@ -2246,114 +2279,114 @@ 3: ------------------------------------------------------------------------------- 3: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 3: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -3: dbcsr_performance_driver 1 1.0 0.000 0.000 0.968 0.971 0 -3: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 0.968 0.971 0 -3: perf_multiply 1 3.0 0.000 0.000 0.944 0.955 0 -3: dbcsr_multiply_generic 10 4.0 0.002 0.002 0.807 0.819 8 -3: multiply_cannon 10 5.0 0.008 0.017 0.512 0.560 3 -3: multiply_cannon_loop 10 6.0 0.007 0.024 0.429 0.486 3 -3: multiply_cannon_multrec 120 7.0 0.260 0.301 0.261 0.302 10 -3: multiply_cannon_metrocomm1 120 7.0 0.001 0.001 0.159 0.194 11 -3: mp_waitall_1 680 8.2 0.158 0.193 0.158 0.193 1 -3: make_m2s 20 5.0 0.001 0.001 0.120 0.140 9 -3: make_images 20 6.0 0.029 0.044 0.116 0.136 9 -3: mp_sum_l 145 2.7 0.077 0.116 0.077 0.116 3 -3: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.077 0.116 6 -3: make_images_sizes 20 7.0 0.000 0.000 0.067 0.076 11 -3: mp_alltoall_i44 20 8.0 0.067 0.076 0.067 0.076 7 -3: mp_allgather_i34 10 6.0 0.058 0.071 0.058 0.071 1 -3: dbcsr_checksum 5 4.0 0.026 0.036 0.056 0.061 5 -3: dbcsr_finalize 17 4.8 0.000 0.000 0.042 0.060 2 -3: dbcsr_merge_all 13 5.8 0.007 0.015 0.037 0.055 7 -3: dbcsr_redistribute 3 4.0 0.020 0.029 0.036 0.052 8 -3: mp_sync 10 4.0 0.040 0.052 0.040 0.052 1 -3: mp_sum_d 76 1.3 0.030 0.039 0.030 0.039 7 -3: dbcsr_copy 30 4.7 0.008 0.010 0.026 0.034 7 -3: dbcsr_make_untransposed_blocks 20 5.0 0.027 0.032 0.027 0.032 7 -3: dbcsr_create_new 297 6.8 0.020 0.030 0.023 0.032 10 -3: dbcsr_make_random_matrix 3 3.0 0.019 0.023 0.024 0.031 0 -3: dbcsr_sort_indices 146 8.8 0.019 0.025 0.019 0.025 8 -3: mp_alltoall_i22 3 5.0 0.014 0.023 0.014 0.023 7 -3: buffer_matrices_ensure_size 20 6.0 0.004 0.022 0.004 0.022 6 -3: merge_index 13 6.8 0.005 0.011 0.005 0.011 8 -3: dbcsr_add_wm_from_matrix 10 5.0 0.001 0.004 0.007 0.010 0 -3: make_images_data 20 7.0 0.000 0.000 0.003 0.010 9 -3: hybrid_alltoall_any 20 8.0 0.003 0.010 0.003 0.010 9 -3: dbcsr_special_finalize 130 7.0 0.001 0.001 0.009 0.009 9 -3: dbcsr_fill_wm_from_matrix 10 6.0 0.006 0.009 0.006 0.009 8 -3: setup_rec_index_2d 20 6.0 0.007 0.009 0.007 0.009 0 -3: dbcsr_data_copy_aa2 13 6.8 0.005 0.009 0.005 0.009 4 -3: dbcsr_merge_single_wm 120 8.0 0.003 0.003 0.007 0.008 10 -3: dbcsr_data_release 830 7.1 0.005 0.007 0.005 0.007 8 -3: make_images_pack 20 7.0 0.005 0.006 0.005 0.006 8 -3: dbcsr_work_destroy_all 146 7.8 0.001 0.002 0.005 0.006 9 -3: dbcsr_init_lib_low 1 1.0 0.002 0.005 0.002 0.005 1 -3: setup_buffer_matrices 20 6.0 0.000 0.000 0.003 0.005 6 -3: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.002 0.004 6 -3: dbcsr_mm_csr_init 10 7.0 0.001 0.002 0.002 0.004 0 -3: dbcsr_destroy 287 5.4 0.001 0.001 0.002 0.004 11 -3: dbcsr_make_index_exist 297 7.8 0.002 0.003 0.002 0.003 6 -3: tree_to_linear_d 3 6.0 0.002 0.003 0.002 0.003 4 -3: dbcsr_make_index_list 130 6.0 0.002 0.003 0.002 0.003 10 -3: mp_max_l 89 1.0 0.002 0.003 0.002 0.003 7 -3: multiply_cannon_metrocomm2 110 7.0 0.001 0.001 0.002 0.003 8 -3: dbcsr_sort_data 120 9.0 0.002 0.002 0.002 0.002 8 -3: fill_hash_tables 10 8.0 0.002 0.002 0.002 0.002 6 -3: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.001 2 -3: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.001 0.001 0.001 3 -3: dbcsr_make_dbcsr_index 146 8.8 0.001 0.001 0.001 0.001 10 -3: dbcsr_make_index_local_row 130 6.0 0.001 0.001 0.001 0.001 9 -3: mp_isend_dv 110 8.0 0.001 0.001 0.001 0.001 4 -3: mp_maxloc_dv 201 1.0 0.001 0.001 0.001 0.001 1 -3: quick_finalize 13 7.5 0.000 0.000 0.001 0.001 9 -3: dbcsr_data_new 571 7.5 0.001 0.001 0.001 0.001 8 -3: mp_bcast_av 98 1.0 0.000 0.000 0.001 0.001 0 -3: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 0 -3: dbcsr_work_create 146 6.8 0.000 0.000 0.001 0.001 3 -3: mp_cart_create 1 5.0 0.000 0.001 0.000 0.001 7 -3: dbcsr_switch_data_area 33 7.0 0.000 0.001 0.000 0.001 8 -3: dbcsr_iterator_start 76 6.8 0.000 0.000 0.001 0.001 6 -3: mp_isend_iv 150 8.0 0.000 0.001 0.000 0.001 8 -3: mp_bcast_i 99 2.0 0.000 0.001 0.000 0.001 5 -3: mp_max_i 92 1.0 0.000 0.000 0.000 0.000 0 +3: dbcsr_performance_driver 1 1.0 0.000 0.000 14.440 14.456 0 +3: dbcsr_perf_multiply_low 1 2.0 0.000 0.001 14.439 14.456 0 +3: perf_multiply 1 3.0 0.000 0.001 14.262 14.305 0 +3: dbcsr_multiply_generic 10 4.0 0.003 0.003 12.074 12.188 6 +3: multiply_cannon 10 5.0 0.112 0.163 6.160 6.591 6 +3: make_m2s 20 5.0 0.002 0.002 3.340 4.137 5 +3: multiply_cannon_loop 10 6.0 0.459 0.565 3.794 4.133 2 +3: make_images 20 6.0 0.337 0.417 3.134 3.528 5 +3: make_images_sizes 20 7.0 0.000 0.000 2.204 2.656 6 +3: mp_alltoall_i44 20 8.0 2.204 2.656 2.204 2.656 4 +3: mp_sum_l 145 2.7 2.381 2.596 2.381 2.596 0 +3: mp_allgather_i34 10 6.0 1.902 2.333 1.902 2.333 2 +3: multiply_cannon_metrocomm1 70 7.0 0.001 0.002 1.672 2.056 2 +3: mp_waitall_1 480 8.2 1.671 2.055 1.671 2.055 2 +3: mp_maxloc_dv 201 1.0 1.688 1.932 1.688 1.932 4 +3: multiply_cannon_multrec 70 7.0 1.655 1.906 1.660 1.913 5 +3: mp_sum_d 76 1.3 1.369 1.619 1.369 1.619 3 +3: dbcsr_checksum 5 4.0 0.551 0.718 0.961 1.055 6 +3: mp_max_l 89 1.0 0.776 0.993 0.776 0.993 6 +3: mp_max_i 92 1.0 0.821 0.948 0.821 0.948 4 +3: dbcsr_redistribute 3 4.0 0.345 0.537 0.797 0.882 0 +3: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.691 0.864 4 +3: dbcsr_special_finalize 80 7.0 0.079 0.209 0.276 0.738 5 +3: dbcsr_create_new 197 6.7 0.334 0.410 0.584 0.733 5 +3: dbcsr_copy 30 4.7 0.189 0.240 0.500 0.680 1 +3: dbcsr_finalize 17 4.8 0.016 0.029 0.490 0.612 2 +3: dbcsr_make_index_list 80 6.0 0.201 0.606 0.201 0.606 5 +3: dbcsr_merge_all 13 5.8 0.284 0.386 0.448 0.565 2 +3: dbcsr_merge_single_wm 70 8.0 0.106 0.282 0.180 0.492 5 +3: mp_alltoall_i22 3 5.0 0.298 0.467 0.298 0.467 1 +3: mp_sync 10 4.0 0.340 0.449 0.340 0.449 5 +3: setup_rec_index_2d 20 6.0 0.122 0.364 0.122 0.364 4 +3: mp_bcast_av 98 1.0 0.001 0.002 0.210 0.331 5 +3: mp_bcast_i 99 2.0 0.209 0.329 0.209 0.329 5 +3: dbcsr_make_index_exist 197 7.7 0.248 0.322 0.248 0.322 5 +3: setup_buffer_matrices 20 6.0 0.001 0.001 0.088 0.280 4 +3: dbcsr_make_random_matrix 3 3.0 0.087 0.104 0.177 0.271 0 +3: buffer_matrices_ensure_size 20 6.0 0.127 0.252 0.127 0.252 4 +3: make_images_data 20 7.0 0.001 0.001 0.119 0.251 5 +3: hybrid_alltoall_any 20 8.0 0.117 0.249 0.118 0.250 1 +3: mp_sum_b 20 5.0 0.207 0.244 0.207 0.244 0 +3: dbcsr_make_untransposed_blocks 20 5.0 0.157 0.222 0.158 0.222 0 +3: dbcsr_sort_data 70 9.0 0.068 0.206 0.068 0.206 5 +3: dbcsr_add_wm_from_matrix 10 5.0 0.082 0.157 0.104 0.189 0 +3: merge_index 13 6.8 0.062 0.096 0.062 0.096 2 +3: mp_cart_create 1 5.0 0.080 0.094 0.080 0.094 6 +3: dbcsr_sort_indices 96 8.6 0.069 0.090 0.069 0.090 6 +3: mp_cart_sub 2 5.0 0.067 0.072 0.067 0.072 4 +3: dbcsr_data_release 630 7.1 0.041 0.065 0.041 0.065 4 +3: mp_sum_lv 2 1.0 0.038 0.052 0.038 0.052 6 +3: dbcsr_init_lib_low 1 1.0 0.025 0.050 0.025 0.050 0 +3: dbcsr_work_destroy_all 96 7.6 0.002 0.009 0.027 0.047 6 +3: dbcsr_data_copy_aa2 13 6.8 0.027 0.038 0.027 0.038 5 +3: quick_finalize 13 7.5 0.015 0.036 0.017 0.037 5 +3: mp_sum_i 1 1.0 0.023 0.036 0.023 0.036 2 +3: dbcsr_fill_wm_from_matrix 10 6.0 0.021 0.031 0.022 0.032 0 +3: mp_bcast_iv 2 1.0 0.013 0.028 0.013 0.028 5 +3: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.012 0.024 4 +3: dbcsr_mm_csr_init 10 7.0 0.007 0.021 0.012 0.024 0 +3: mp_max_d 1 1.0 0.016 0.020 0.016 0.020 3 +3: mp_sum_rv 1 1.0 0.013 0.020 0.013 0.020 2 +3: mp_min_rv 1 1.0 0.008 0.020 0.008 0.020 4 +3: mp_sum_r 1 1.0 0.009 0.020 0.009 0.020 0 +3: dbcsr_make_dbcsr_index 96 8.6 0.005 0.018 0.005 0.018 0 +3: mp_sum_lm3 1 1.0 0.012 0.016 0.012 0.016 3 +3: mp_max_r 1 1.0 0.007 0.016 0.007 0.016 3 +3: fill_hash_tables 10 8.0 0.005 0.015 0.005 0.015 4 +3: dbcsr_destroy 187 5.4 0.002 0.009 0.006 0.013 1 +3: tree_to_linear_d 3 6.0 0.007 0.013 0.007 0.013 6 +3: make_images_pack 20 7.0 0.011 0.012 0.011 0.012 2 +3: mp_max_rv 1 1.0 0.009 0.012 0.009 0.012 0 +3: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.005 0.012 2 +3: dbcsr_mm_multrec_finalize 10 9.0 0.005 0.012 0.005 0.012 0 +3: mp_alltoall_d11v 9 5.0 0.004 0.010 0.004 0.010 2 +3: dbcsr_data_new 421 7.3 0.003 0.010 0.003 0.010 4 +3: dbcsr_make_index_local_row 80 6.0 0.003 0.009 0.003 0.009 0 +3: multiply_cannon_metrocomm2 60 7.0 0.001 0.001 0.003 0.003 1 +3: dbcsr_work_create 96 6.7 0.001 0.001 0.001 0.001 5 +3: dbcsr_iterator_start 76 6.8 0.001 0.001 0.001 0.001 6 +3: mp_isend_iv 100 8.0 0.001 0.001 0.001 0.001 6 +3: mp_irecv_iv 100 8.0 0.001 0.001 0.001 0.001 6 +3: dbcsr_iterator_seek 76 7.8 0.001 0.001 0.001 0.001 2 +3: mp_irecv_dv 60 8.0 0.001 0.001 0.001 0.001 4 +3: dbcsr_distribution_new 26 4.7 0.001 0.001 0.001 0.001 1 +3: dbcsr_iterator_stop 76 6.8 0.000 0.000 0.000 0.001 6 +3: mp_isend_dv 60 8.0 0.000 0.001 0.000 0.001 6 +3: dbcsr_switch_data_area 33 7.0 0.000 0.000 0.000 0.000 6 3: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 0 -3: mp_irecv_dv 110 8.0 0.000 0.000 0.000 0.000 8 -3: dbcsr_iterator_seek 76 7.8 0.000 0.000 0.000 0.000 11 -3: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 4 -3: dbcsr_distribution_new 26 4.7 0.000 0.000 0.000 0.000 9 -3: mp_irecv_iv 150 8.0 0.000 0.000 0.000 0.000 7 -3: dbcsr_iterator_stop 76 6.8 0.000 0.000 0.000 0.000 9 -3: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 11 -3: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 4 -3: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 1 -3: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 3 -3: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 -3: multiply_cannon_metrocomm3 120 7.0 0.000 0.000 0.000 0.000 8 -3: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 10 -3: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 10 -3: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 8 -3: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 6 -3: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 7 -3: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 8 -3: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 7 -3: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 1 -3: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 1 -3: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 6 -3: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 8 -3: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 6 -3: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 11 -3: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 11 -3: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 1 -3: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 9 -3: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 8 -3: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 6 +3: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 0 +3: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 6 +3: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 2 +3: multiply_cannon_metrocomm3 70 7.0 0.000 0.000 0.000 0.000 5 +3: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 0 +3: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 0 +3: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 2 +3: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 2 +3: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 4 +3: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 4 +3: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 2 +3: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 3 +3: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 0 3: ------------------------------------------------------------------------------- 3: - 3/19 Test #3: dbcsr_perf:inputs/test_rect1_sparse.perf .............. Passed 1.05 sec + 3/19 Test #3: dbcsr_perf:inputs/test_rect1_sparse.perf .............. Passed 22.50 sec test 4 Start 4: dbcsr_perf:inputs/test_rect2_dense.perf -4: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_rect2_dense.perf" +4: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_rect2_dense.perf" 4: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 4: Environment variables: 4: OMP_NUM_THREADS=2 @@ -2372,12 +2405,12 @@ 4: DBCSR| Use Communication thread T (D) 4: DBCSR| Communication thread load 100 (D) 4: DBCSR| MPI: My process id 0 -4: DBCSR| MPI: Number of processes 12 +4: DBCSR| MPI: Number of processes 7 4: DBCSR| OMP: Current number of threads 2 4: DBCSR| OMP: Max number of threads 2 4: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 4: numthreads 2 -4: numnodes 12 +4: numnodes 7 4: matrix_sizes 100 100 1000 4: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 4: trans TN @@ -2394,7 +2427,7 @@ 4: ******************************************************************************** 4: -- PERF dbcsr_multiply (T, N, 3 , N, N, N) 4: matrix sizes A( 1000 x 100), B( 1000 x 100) and C( 100 x 100) -4: numnodes (nprows X npcols) = 12( 12 X 1) +4: numnodes (nprows X npcols) = 7( 7 X 1) 4: nthreads = 2 4: checksum(A) = 0.333563309139543E+05 4: checksum(B) = 0.333056034107568E+05 @@ -2404,12 +2437,12 @@ 4: 4: 4: mean std minmin maxmax -4: time = 37.43E-03 2.29E-03 27.00E-03 53.36E-03 seconds -4: perf total = 522.82E+06 29.46E+06 374.83E+06 680.07E+06 FLOPS -4: perf per node = 43.57E+06 2.46E+06 31.24E+06 56.67E+06 FLOPS -4: perf per thread = 21.78E+06 1.23E+06 15.62E+06 28.34E+06 FLOPS -4: load imbalance = 0.36E-01 0.21E-02 0.27E-01 0.49E-01 -4: rel load imbal = 0.92E+00 0.29E-03 0.92E+00 0.92E+00 +4: time = 590.94E-03 48.13E-03 375.83E-03 916.01E-03 seconds +4: perf total = 34.48E+06 2.72E+06 21.83E+06 48.50E+06 FLOPS +4: perf per node = 4.93E+06 388.98E+03 3.12E+06 6.93E+06 FLOPS +4: perf per thread = 2.46E+06 194.49E+03 1.56E+06 3.46E+06 FLOPS +4: load imbalance = 0.53E+00 0.43E-01 0.36E+00 0.79E+00 +4: rel load imbal = 0.86E+00 0.79E-03 0.86E+00 0.87E+00 4: ******************************************************************************** 4: 4: ------------------------------------------------------------------------------- @@ -2418,41 +2451,41 @@ 4: - - 4: ------------------------------------------------------------------------------- 4: COUNTER TOTAL BLAS SMM ACC -4: flops 10 x 100 x 80 6400000 100.0% 0.0% 0.0% -4: flops 10 x 100 x 85 13600000 100.0% 0.0% 0.0% -4: flops 5 x 100 x 80 57600000 100.0% 0.0% 0.0% -4: flops 5 x 100 x 85 122400000 100.0% 0.0% 0.0% +4: flops 5 x 100 x 140 33600000 100.0% 0.0% 0.0% +4: flops 5 x 100 x 145 46400000 100.0% 0.0% 0.0% +4: flops 10 x 100 x 140 50400000 100.0% 0.0% 0.0% +4: flops 10 x 100 x 145 69600000 100.0% 0.0% 0.0% 4: flops inhomo. stacks 0 0.0% 0.0% 0.0% 4: flops total 200.000000E+06 100.0% 0.0% 0.0% -4: flops max/rank 20.000000E+06 100.0% 0.0% 0.0% +4: flops max/rank 30.000000E+06 100.0% 0.0% 0.0% 4: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% -4: matmuls total 2280 100.0% 0.0% 0.0% -4: number of processed stacks 2280 100.0% 0.0% 0.0% +4: matmuls total 980 100.0% 0.0% 0.0% +4: number of processed stacks 980 100.0% 0.0% 0.0% 4: average stack size 1.0 0.0 0.0 -4: marketing flops 200.000016E+06 +4: marketing flops 199.999968E+06 4: ------------------------------------------------------------------------------- 4: # multiplications 10 -4: max memory usage/rank 100.540416E+06 -4: # max total images/rank 12 +4: max memory usage/rank 74.067968E+06 +4: # max total images/rank 7 4: # max 3D layers 1 -4: # MPI messages exchanged 1320 +4: # MPI messages exchanged 420 4: MPI messages size (bytes): -4: total size 88.000000E+06 -4: min size 64.000000E+03 -4: max size 68.000000E+03 -4: average size 66.666664E+03 +4: total size 48.000000E+06 +4: min size 112.000000E+03 +4: max size 116.000000E+03 +4: average size 114.285711E+03 4: MPI breakdown and total messages size (bytes): 4: size <= 128 0 0 4: 128 < size <= 8192 0 0 4: 8192 < size <= 32768 0 0 -4: 32768 < size <= 131072 1320 88000000 +4: 32768 < size <= 131072 420 48000000 4: 131072 < size <= 4194304 0 0 4: 4194304 < size <= 16777216 0 0 4: 16777216 < size 0 0 4: ------------------------------------------------------------------------------- 4: 4: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -4: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +4: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 4: 4: ------------------------------------------------------------------------------- 4: - - @@ -2461,10 +2494,10 @@ 4: ------------------------------------------------------------------------------- 4: ROUTINE CALLS AVE VOLUME [Bytes] 4: MP_Bcast 5 12. -4: MP_Allreduce 94 32. -4: MP_Alltoall 41 14576. -4: MP_ISend 480 16894. -4: MP_IRecv 480 17344. +4: MP_Allreduce 94 24. +4: MP_Alltoall 41 25033. +4: MP_ISend 280 29426. +4: MP_IRecv 280 29440. 4: ------------------------------------------------------------------------------- 4: 4: ------------------------------------------------------------------------------- @@ -2474,121 +2507,121 @@ 4: ------------------------------------------------------------------------------- 4: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 4: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -4: dbcsr_performance_driver 1 1.0 0.000 0.000 0.433 0.436 0 -4: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 0.433 0.436 0 -4: perf_multiply 1 3.0 0.000 0.000 0.429 0.434 0 -4: dbcsr_multiply_generic 10 4.0 0.001 0.002 0.374 0.382 9 -4: multiply_cannon 10 5.0 0.007 0.012 0.144 0.167 5 -4: make_m2s 20 5.0 0.001 0.001 0.136 0.143 10 -4: make_images 20 6.0 0.016 0.024 0.122 0.131 8 -4: multiply_cannon_loop 10 6.0 0.002 0.011 0.105 0.127 9 -4: mp_waitall_1 680 8.2 0.101 0.122 0.101 0.122 8 -4: multiply_cannon_metrocomm1 120 7.0 0.001 0.001 0.074 0.097 3 -4: mp_sum_l 145 2.7 0.074 0.088 0.074 0.088 2 -4: make_images_sizes 20 7.0 0.000 0.000 0.063 0.071 9 -4: mp_alltoall_i44 20 8.0 0.063 0.071 0.063 0.071 11 -4: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.052 0.063 0 -4: multiply_cannon_multrec 120 7.0 0.026 0.046 0.026 0.046 9 -4: make_images_data 20 7.0 0.001 0.001 0.030 0.035 7 -4: hybrid_alltoall_any 20 8.0 0.001 0.004 0.028 0.034 6 -4: mp_allgather_i34 10 6.0 0.028 0.033 0.028 0.033 0 -4: mp_sync 10 4.0 0.021 0.025 0.021 0.025 11 -4: dbcsr_redistribute 3 4.0 0.005 0.010 0.019 0.023 10 -4: dbcsr_special_finalize 130 7.0 0.000 0.000 0.009 0.023 3 -4: quick_finalize 133 8.0 0.007 0.021 0.008 0.022 2 -4: dbcsr_create_new 457 6.8 0.013 0.018 0.015 0.020 2 -4: mp_alltoall_i22 3 5.0 0.013 0.017 0.013 0.017 5 -4: dbcsr_make_images_dense 20 6.0 0.001 0.001 0.012 0.017 6 -4: dbcsr_checksum 5 4.0 0.003 0.005 0.014 0.015 6 -4: mp_sum_d 76 1.3 0.012 0.014 0.012 0.014 5 -4: dbcsr_make_dists_dense 10 5.0 0.005 0.013 0.005 0.013 4 -4: dbcsr_make_dense_low 140 6.9 0.001 0.002 0.009 0.013 7 -4: dbcsr_make_undense 10 5.0 0.000 0.000 0.005 0.013 6 -4: make_dense_data 140 7.9 0.004 0.009 0.007 0.011 8 -4: dbcsr_new_transposed 10 5.0 0.000 0.000 0.006 0.010 6 -4: dbcsr_init_lib_low 1 1.0 0.003 0.009 0.003 0.009 11 -4: mp_max_l 96 1.0 0.006 0.007 0.006 0.007 11 -4: dbcsr_make_dense 10 5.0 0.000 0.000 0.001 0.006 11 -4: dbcsr_make_random_matrix 3 3.0 0.003 0.003 0.004 0.004 3 -4: dbcsr_iterator_start 226 8.1 0.002 0.004 0.002 0.004 4 -4: dbcsr_iterator_stop 226 8.1 0.001 0.004 0.001 0.004 1 -4: dbcsr_finalize 17 4.8 0.000 0.000 0.002 0.003 9 -4: make_images_pack 20 7.0 0.002 0.002 0.002 0.003 3 -4: dbcsr_make_index_exist 457 7.8 0.002 0.002 0.002 0.002 6 -4: dbcsr_copy 10 4.0 0.000 0.002 0.001 0.002 5 -4: setup_buffer_matrices 20 6.0 0.000 0.000 0.002 0.002 6 -4: dbcsr_destroy 447 5.9 0.001 0.001 0.001 0.002 6 -4: dbcsr_make_index_list 130 6.0 0.001 0.002 0.001 0.002 6 -4: multiply_cannon_metrocomm2 110 7.0 0.001 0.001 0.002 0.002 6 -4: dbcsr_merge_all 13 5.8 0.000 0.001 0.001 0.002 8 -4: dbcsr_data_release 1850 7.9 0.001 0.002 0.001 0.002 6 -4: mp_isend_dv 220 8.5 0.001 0.002 0.001 0.002 7 -4: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.001 0.001 0.002 10 -4: dbcsr_sort_indices 156 8.6 0.001 0.002 0.001 0.002 4 -4: mp_bcast_av 105 1.0 0.000 0.001 0.001 0.001 3 -4: dbcsr_data_new 1031 7.8 0.001 0.001 0.001 0.001 6 -4: mp_maxloc_dv 215 1.0 0.001 0.001 0.001 0.001 6 -4: dbcsr_fill_wm_from_matrix 10 6.0 0.000 0.001 0.000 0.001 6 -4: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 0 -4: setup_rec_index_2d 20 6.0 0.001 0.001 0.001 0.001 6 -4: transpose_index_local 10 6.0 0.000 0.000 0.001 0.001 6 -4: tree_to_linear_d 3 6.0 0.000 0.001 0.000 0.001 2 -4: mp_bcast_i 106 2.0 0.001 0.001 0.001 0.001 8 -4: mp_max_i 102 1.0 0.001 0.001 0.001 0.001 9 -4: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.001 0.001 5 -4: dbcsr_mm_csr_init 10 7.0 0.001 0.001 0.001 0.001 8 -4: buffer_matrices_ensure_size 20 6.0 0.000 0.001 0.000 0.001 7 -4: dbcsr_make_untransposed_blocks 20 5.0 0.000 0.001 0.000 0.001 9 -4: dbcsr_switch_data_area 293 8.3 0.000 0.000 0.001 0.001 7 -4: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.000 0.001 0 -4: dbcsr_mm_multrec_finalize 10 9.0 0.000 0.001 0.000 0.001 3 -4: dbcsr_work_create 146 6.8 0.000 0.000 0.000 0.000 11 +4: dbcsr_performance_driver 1 1.0 0.000 0.000 7.181 7.192 0 +4: dbcsr_perf_multiply_low 1 2.0 0.004 0.024 7.180 7.192 6 +4: perf_multiply 1 3.0 0.003 0.008 7.150 7.173 4 +4: dbcsr_multiply_generic 10 4.0 0.005 0.019 5.909 5.998 0 +4: multiply_cannon 10 5.0 0.129 0.168 2.262 2.346 3 +4: make_m2s 20 5.0 0.001 0.002 1.786 1.815 0 +4: make_images 20 6.0 0.180 0.209 1.712 1.758 2 +4: multiply_cannon_loop 10 6.0 0.190 0.254 1.540 1.706 2 +4: mp_waitall_1 480 8.2 1.332 1.595 1.332 1.595 0 +4: mp_sum_l 145 2.7 1.155 1.336 1.155 1.336 4 +4: multiply_cannon_metrocomm1 70 7.0 0.001 0.001 1.000 1.225 4 +4: make_images_sizes 20 7.0 0.000 0.000 0.920 1.045 1 +4: mp_alltoall_i44 20 8.0 0.920 1.045 0.920 1.045 5 +4: dbcsr_redistribute 3 4.0 0.172 0.326 0.565 0.597 1 +4: dbcsr_create_new 307 6.7 0.307 0.401 0.413 0.554 0 +4: mp_allgather_i34 10 6.0 0.423 0.488 0.423 0.488 3 +4: mp_alltoall_i22 3 5.0 0.349 0.481 0.349 0.481 5 +4: make_images_data 20 7.0 0.001 0.001 0.410 0.451 0 +4: mp_sync 10 4.0 0.352 0.428 0.352 0.428 1 +4: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.356 0.421 3 +4: hybrid_alltoall_any 20 8.0 0.073 0.101 0.338 0.406 6 +4: multiply_cannon_multrec 70 7.0 0.343 0.399 0.348 0.400 2 +4: dbcsr_checksum 5 4.0 0.077 0.137 0.297 0.332 3 +4: dbcsr_special_finalize 80 7.0 0.001 0.001 0.182 0.308 0 +4: quick_finalize 83 7.9 0.183 0.305 0.187 0.307 0 +4: mp_sum_d 76 1.3 0.228 0.280 0.228 0.280 5 +4: dbcsr_new_transposed 10 5.0 0.017 0.040 0.175 0.255 0 +4: mp_sum_b 20 5.0 0.221 0.251 0.221 0.251 6 +4: dbcsr_make_undense 10 5.0 0.020 0.047 0.142 0.236 3 +4: setup_rec_index_2d 20 6.0 0.095 0.203 0.095 0.203 3 +4: dbcsr_make_index_exist 307 7.7 0.105 0.152 0.105 0.152 0 +4: dbcsr_make_dense 10 5.0 0.000 0.000 0.093 0.149 0 +4: dbcsr_finalize 17 4.8 0.003 0.016 0.060 0.139 3 +4: dbcsr_make_dense_low 90 6.9 0.002 0.002 0.047 0.127 0 +4: make_dense_data 90 7.9 0.024 0.049 0.044 0.124 0 +4: dbcsr_merge_all 13 5.8 0.045 0.085 0.051 0.123 3 +4: mp_max_i 102 1.0 0.079 0.113 0.079 0.113 2 +4: dbcsr_make_dists_dense 10 5.0 0.090 0.103 0.090 0.103 3 +4: mp_max_l 96 1.0 0.088 0.098 0.088 0.098 1 +4: mp_sum_lv 5 1.0 0.087 0.095 0.087 0.095 0 +4: dbcsr_iterator_start 176 7.8 0.029 0.085 0.029 0.086 0 +4: dbcsr_make_images_dense 20 6.0 0.001 0.001 0.032 0.085 0 +4: buffer_matrices_ensure_size 20 6.0 0.051 0.081 0.051 0.081 3 +4: dbcsr_init_lib_low 1 1.0 0.031 0.060 0.031 0.060 6 +4: setup_buffer_matrices 20 6.0 0.000 0.001 0.019 0.058 6 +4: dbcsr_make_random_matrix 3 3.0 0.006 0.012 0.027 0.054 5 +4: dbcsr_copy 10 4.0 0.017 0.044 0.017 0.044 5 +4: mp_cart_create 1 5.0 0.030 0.036 0.030 0.036 5 +4: mp_bcast_av 105 1.0 0.008 0.017 0.024 0.030 2 +4: merge_index 13 6.8 0.004 0.028 0.004 0.028 3 +4: mp_bcast_i 106 2.0 0.016 0.025 0.016 0.025 1 +4: mp_sum_i 1 1.0 0.018 0.024 0.018 0.024 6 +4: mp_sum_lm3 1 1.0 0.020 0.024 0.020 0.024 2 +4: mp_maxloc_dv 215 1.0 0.018 0.022 0.018 0.022 6 +4: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.005 0.021 0 +4: dbcsr_mm_multrec_finalize 10 9.0 0.005 0.020 0.005 0.020 5 +4: dbcsr_iterator_stop 176 7.8 0.010 0.019 0.010 0.019 0 +4: dbcsr_add_wm_from_matrix 10 5.0 0.001 0.008 0.003 0.017 0 +4: mp_bcast_iv 5 1.0 0.006 0.016 0.006 0.016 0 +4: mp_max_r 1 1.0 0.009 0.016 0.009 0.016 4 +4: mp_max_rv 1 1.0 0.006 0.016 0.006 0.016 0 +4: dbcsr_sort_indices 106 8.5 0.006 0.015 0.006 0.015 2 +4: dbcsr_make_index_list 80 6.0 0.003 0.014 0.003 0.014 3 +4: mp_min_rv 1 1.0 0.008 0.012 0.008 0.012 6 +4: mp_sum_r 1 1.0 0.005 0.012 0.005 0.012 2 +4: mp_cart_sub 2 5.0 0.008 0.009 0.008 0.009 3 +4: mp_sum_root_rm 2 4.0 0.002 0.009 0.002 0.009 0 +4: dbcsr_make_untransposed_blocks 20 5.0 0.003 0.008 0.003 0.009 0 +4: dbcsr_fill_wm_from_matrix 10 6.0 0.001 0.008 0.002 0.008 0 +4: mp_max_d 1 1.0 0.005 0.008 0.005 0.008 3 +4: mp_sum_rv 1 1.0 0.007 0.008 0.007 0.008 0 +4: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.004 0.008 5 +4: dbcsr_mm_csr_init 10 7.0 0.004 0.008 0.004 0.008 3 +4: transpose_index_local 10 6.0 0.000 0.000 0.002 0.006 1 +4: make_images_pack 20 7.0 0.005 0.005 0.005 0.005 6 +4: dbcsr_destroy 297 5.8 0.001 0.002 0.003 0.003 0 +4: dbcsr_data_release 1300 7.8 0.003 0.003 0.003 0.003 1 +4: dbcsr_data_new 731 7.6 0.002 0.002 0.002 0.002 6 +4: multiply_cannon_metrocomm2 60 7.0 0.001 0.001 0.002 0.002 0 +4: mp_isend_dv 120 8.5 0.001 0.001 0.001 0.001 3 +4: dbcsr_switch_data_area 193 8.1 0.001 0.001 0.001 0.001 0 +4: dbcsr_work_create 96 6.7 0.001 0.001 0.001 0.001 5 +4: mp_isend_iv 160 8.0 0.001 0.001 0.001 0.001 5 +4: tree_to_linear_d 3 6.0 0.001 0.001 0.001 0.001 0 +4: dbcsr_work_destroy_all 96 7.6 0.000 0.000 0.001 0.001 0 +4: mp_irecv_dv 120 8.5 0.000 0.001 0.000 0.001 1 +4: dbcsr_iterator_seek 176 8.8 0.000 0.001 0.000 0.001 5 4: dbcsr_distribution_new 66 5.5 0.000 0.000 0.000 0.000 0 -4: mp_irecv_dv 220 8.5 0.000 0.000 0.000 0.000 6 -4: dbcsr_work_destroy_all 146 7.8 0.000 0.000 0.000 0.000 10 -4: mp_isend_iv 260 8.0 0.000 0.000 0.000 0.000 11 -4: dbcsr_iterator_seek 226 9.1 0.000 0.000 0.000 0.000 7 -4: dbcsr_index_prune_deleted 130 7.0 0.000 0.000 0.000 0.000 4 -4: mp_irecv_iv 260 8.0 0.000 0.000 0.000 0.000 6 -4: merge_index 13 6.8 0.000 0.000 0.000 0.000 9 -4: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 10 -4: dbcsr_make_index_local_row 130 6.0 0.000 0.000 0.000 0.000 6 -4: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 7 +4: mp_irecv_iv 160 8.0 0.000 0.000 0.000 0.000 1 +4: dbcsr_make_dbcsr_index 106 8.5 0.000 0.000 0.000 0.000 0 +4: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 0 +4: dbcsr_data_copy_aa2 13 6.8 0.000 0.000 0.000 0.000 3 +4: dbcsr_index_prune_deleted 80 7.0 0.000 0.000 0.000 0.000 4 +4: dbcsr_make_index_local_row 80 6.0 0.000 0.000 0.000 0.000 2 4: dbcsr_dist_bin 5 3.0 0.000 0.000 0.000 0.000 1 -4: dbcsr_make_dbcsr_index 156 8.6 0.000 0.000 0.000 0.000 3 -4: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 6 -4: dbcsr_data_copy_aa2 13 6.7 0.000 0.000 0.000 0.000 6 -4: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 10 -4: dbcsr_get_local_rows 20 5.5 0.000 0.000 0.000 0.000 4 -4: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 4 -4: multiply_cannon_metrocomm3 120 7.0 0.000 0.000 0.000 0.000 10 -4: mp_sum_lv 5 1.0 0.000 0.000 0.000 0.000 2 -4: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 3 -4: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 6 -4: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 10 -4: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 9 -4: mp_bcast_iv 5 1.0 0.000 0.000 0.000 0.000 9 -4: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 3 -4: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 10 -4: dbcsr_get_local_cols 20 5.5 0.000 0.000 0.000 0.000 6 -4: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 4 -4: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 4 -4: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 0 +4: dbcsr_get_local_rows 20 5.5 0.000 0.000 0.000 0.000 0 +4: multiply_cannon_metrocomm3 70 7.0 0.000 0.000 0.000 0.000 1 +4: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 1 +4: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 2 +4: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 4 +4: dbcsr_get_local_cols 20 5.5 0.000 0.000 0.000 0.000 1 +4: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 1 +4: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 0 +4: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 5 +4: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 0 4: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 6 -4: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 8 -4: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 0 -4: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 9 -4: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 8 -4: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 9 -4: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 1 -4: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 5 +4: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 5 +4: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 1 4: ------------------------------------------------------------------------------- 4: - 4/19 Test #4: dbcsr_perf:inputs/test_rect2_dense.perf ............... Passed 0.51 sec + 4/19 Test #4: dbcsr_perf:inputs/test_rect2_dense.perf ............... Passed 8.18 sec test 5 Start 5: dbcsr_perf:inputs/test_rect2_sparse.perf -5: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_rect2_sparse.perf" +5: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_rect2_sparse.perf" 5: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 5: Environment variables: 5: OMP_NUM_THREADS=2 @@ -2607,12 +2640,12 @@ 5: DBCSR| Use Communication thread T (D) 5: DBCSR| Communication thread load 100 (D) 5: DBCSR| MPI: My process id 0 -5: DBCSR| MPI: Number of processes 12 +5: DBCSR| MPI: Number of processes 7 5: DBCSR| OMP: Current number of threads 2 5: DBCSR| OMP: Max number of threads 2 5: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 5: numthreads 2 -5: numnodes 12 +5: numnodes 7 5: matrix_sizes 1000 1000 5000 5: sparsities 0.90000000000000002 0.90000000000000002 0.90000000000000002 5: trans TN @@ -2629,7 +2662,7 @@ 5: ******************************************************************************** 5: -- PERF dbcsr_multiply (T, N, 3 , N, N, N) 5: matrix sizes A( 5000 x 1000), B( 5000 x 1000) and C( 1000 x 1000) -5: numnodes (nprows X npcols) = 12( 12 X 1) +5: numnodes (nprows X npcols) = 7( 7 X 1) 5: nthreads = 2 5: checksum(A) = 0.167223715953740E+06 5: checksum(B) = 0.166538681814745E+06 @@ -2639,12 +2672,12 @@ 5: 5: 5: mean std minmin maxmax -5: time = 67.86E-03 2.36E-03 60.08E-03 83.24E-03 seconds -5: perf total = 1.44E+09 45.27E+06 1.21E+09 1.59E+09 FLOPS -5: perf per node = 120.24E+06 3.77E+06 100.49E+06 132.80E+06 FLOPS -5: perf per thread = 60.12E+06 1.89E+06 50.24E+06 66.40E+06 FLOPS -5: load imbalance = 0.65E-01 0.22E-02 0.58E-01 0.76E-01 -5: rel load imbal = 0.92E+00 0.19E-03 0.92E+00 0.92E+00 +5: time = 856.29E-03 136.03E-03 595.23E-03 2.15E+00 seconds +5: perf total = 126.91E+06 9.31E+06 46.64E+06 158.47E+06 FLOPS +5: perf per node = 18.13E+06 1.33E+06 6.66E+06 22.64E+06 FLOPS +5: perf per thread = 9.06E+06 665.20E+03 3.33E+06 11.32E+06 FLOPS +5: load imbalance = 0.76E+00 0.12E+00 0.55E+00 0.18E+01 +5: rel load imbal = 0.86E+00 0.84E-03 0.86E+00 0.87E+00 5: ******************************************************************************** 5: 5: ------------------------------------------------------------------------------- @@ -2656,35 +2689,35 @@ 5: flops 5 x 5 x 5 1003697500 100.0% 0.0% 0.0% 5: flops inhomo. stacks 0 0.0% 0.0% 0.0% 5: flops total 1.003698E+09 100.0% 0.0% 0.0% -5: flops max/rank 88.107500E+06 100.0% 0.0% 0.0% +5: flops max/rank 149.005000E+06 100.0% 0.0% 0.0% 5: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% 5: matmuls total 4014790 100.0% 0.0% 0.0% -5: number of processed stacks 5710 100.0% 0.0% 0.0% -5: average stack size 703.1 0.0 0.0 -5: marketing flops 99.999998E+09 +5: number of processed stacks 4460 100.0% 0.0% 0.0% +5: average stack size 900.2 0.0 0.0 +5: marketing flops 99.999990E+09 5: ------------------------------------------------------------------------------- 5: # multiplications 10 -5: max memory usage/rank 105.365504E+06 -5: # max total images/rank 12 +5: max memory usage/rank 84.484096E+06 +5: # max total images/rank 7 5: # max 3D layers 1 -5: # MPI messages exchanged 1320 +5: # MPI messages exchanged 420 5: MPI messages size (bytes): -5: total size 439.868000E+06 -5: min size 324.400000E+03 -5: max size 344.600000E+03 -5: average size 333.233344E+03 +5: total size 239.928000E+06 +5: min size 561.200000E+03 +5: max size 583.400000E+03 +5: average size 571.257125E+03 5: MPI breakdown and total messages size (bytes): 5: size <= 128 0 0 5: 128 < size <= 8192 0 0 5: 8192 < size <= 32768 0 0 5: 32768 < size <= 131072 0 0 -5: 131072 < size <= 4194304 1320 439868000 +5: 131072 < size <= 4194304 420 239928000 5: 4194304 < size <= 16777216 0 0 5: 16777216 < size 0 0 5: ------------------------------------------------------------------------------- 5: 5: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -5: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +5: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 5: 5: ------------------------------------------------------------------------------- 5: - - @@ -2693,10 +2726,10 @@ 5: ------------------------------------------------------------------------------- 5: ROUTINE CALLS AVE VOLUME [Bytes] 5: MP_Bcast 2 12. -5: MP_Allreduce 88 33. -5: MP_Alltoall 41 75049. -5: MP_ISend 480 89514. -5: MP_IRecv 480 89269. +5: MP_Allreduce 88 24. +5: MP_Alltoall 41 128384. +5: MP_ISend 280 154701. +5: MP_IRecv 280 154122. 5: ------------------------------------------------------------------------------- 5: 5: ------------------------------------------------------------------------------- @@ -2706,116 +2739,116 @@ 5: ------------------------------------------------------------------------------- 5: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 5: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -5: dbcsr_performance_driver 1 1.0 0.000 0.000 0.797 0.799 0 -5: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 0.797 0.798 0 -5: perf_multiply 1 3.0 0.000 0.000 0.774 0.779 0 -5: dbcsr_multiply_generic 10 4.0 0.002 0.002 0.679 0.686 7 -5: multiply_cannon 10 5.0 0.011 0.024 0.388 0.415 8 -5: multiply_cannon_loop 10 6.0 0.005 0.013 0.323 0.352 4 -5: mp_waitall_1 680 8.2 0.200 0.218 0.200 0.218 1 -5: multiply_cannon_metrocomm1 120 7.0 0.001 0.001 0.174 0.194 7 -5: make_m2s 20 5.0 0.001 0.002 0.165 0.177 7 -5: make_images 20 6.0 0.032 0.052 0.161 0.173 6 -5: multiply_cannon_multrec 120 7.0 0.142 0.164 0.143 0.165 9 -5: mp_sum_l 145 2.7 0.076 0.089 0.076 0.089 7 -5: make_images_sizes 20 7.0 0.000 0.000 0.062 0.074 6 -5: mp_alltoall_i44 20 8.0 0.062 0.074 0.062 0.074 0 -5: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.044 0.058 8 -5: dbcsr_redistribute 3 4.0 0.019 0.032 0.039 0.043 4 -5: dbcsr_create_new 307 6.8 0.026 0.039 0.029 0.041 9 -5: make_images_data 20 7.0 0.001 0.001 0.032 0.040 7 -5: hybrid_alltoall_any 20 8.0 0.002 0.005 0.030 0.038 3 -5: mp_allgather_i34 10 6.0 0.028 0.038 0.028 0.038 0 -5: dbcsr_copy 30 4.7 0.003 0.007 0.018 0.033 4 -5: dbcsr_checksum 5 4.0 0.013 0.024 0.029 0.031 8 -5: mp_sync 10 4.0 0.024 0.030 0.024 0.030 8 -5: buffer_matrices_ensure_size 20 6.0 0.005 0.029 0.005 0.029 2 -5: mp_alltoall_i22 3 5.0 0.018 0.028 0.018 0.028 9 -5: dbcsr_special_finalize 130 7.0 0.001 0.002 0.018 0.027 1 -5: dbcsr_make_random_matrix 3 3.0 0.018 0.022 0.022 0.027 7 -5: dbcsr_new_transposed 10 5.0 0.001 0.004 0.012 0.026 2 -5: dbcsr_merge_single_wm 120 8.0 0.010 0.020 0.015 0.024 6 -5: mp_sum_d 76 1.3 0.017 0.024 0.017 0.024 9 -5: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.003 0.021 7 -5: dbcsr_mm_csr_init 10 7.0 0.003 0.021 0.003 0.021 3 -5: setup_rec_index_2d 20 6.0 0.014 0.021 0.014 0.021 3 -5: dbcsr_finalize 17 4.8 0.000 0.000 0.014 0.020 7 -5: dbcsr_merge_all 13 5.8 0.003 0.011 0.012 0.018 9 -5: make_images_pack 20 7.0 0.013 0.014 0.014 0.014 7 -5: dbcsr_sort_indices 156 8.6 0.012 0.013 0.012 0.013 7 -5: dbcsr_init_lib_low 1 1.0 0.002 0.007 0.002 0.007 1 -5: merge_index 13 6.8 0.002 0.006 0.002 0.006 0 -5: dbcsr_make_index_exist 307 7.8 0.002 0.006 0.002 0.006 2 -5: dbcsr_make_untransposed_blocks 20 5.0 0.006 0.006 0.006 0.006 5 -5: transpose_index_local 10 6.0 0.000 0.000 0.005 0.006 7 -5: dbcsr_data_release 850 7.1 0.003 0.005 0.003 0.005 7 -5: quick_finalize 13 7.5 0.001 0.003 0.002 0.004 5 -5: setup_buffer_matrices 20 6.0 0.000 0.000 0.003 0.004 7 -5: dbcsr_destroy 297 5.4 0.001 0.001 0.003 0.004 7 -5: mp_max_l 91 1.0 0.003 0.004 0.003 0.004 4 -5: mp_isend_dv 220 8.5 0.002 0.004 0.002 0.004 3 -5: dbcsr_make_index_list 130 6.0 0.003 0.003 0.003 0.003 9 -5: dbcsr_sort_data 120 9.0 0.002 0.002 0.002 0.002 7 -5: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.001 0.002 0.002 9 -5: tree_to_linear_d 3 6.0 0.002 0.002 0.002 0.002 10 -5: multiply_cannon_metrocomm2 110 7.0 0.001 0.001 0.002 0.002 7 -5: dbcsr_work_destroy_all 146 7.8 0.000 0.000 0.001 0.002 9 -5: dbcsr_fill_wm_from_matrix 10 6.0 0.001 0.001 0.001 0.001 2 -5: dbcsr_data_copy_aa2 13 6.8 0.001 0.001 0.001 0.001 4 -5: mp_maxloc_dv 205 1.0 0.001 0.001 0.001 0.001 6 -5: dbcsr_data_new 581 7.5 0.001 0.001 0.001 0.001 0 -5: mp_bcast_av 100 1.0 0.000 0.000 0.001 0.001 7 -5: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 4 -5: mp_max_i 94 1.0 0.001 0.001 0.001 0.001 6 -5: mp_isend_iv 260 8.0 0.001 0.001 0.001 0.001 9 -5: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.001 2 -5: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.001 0.001 0.001 10 -5: mp_bcast_i 101 2.0 0.001 0.001 0.001 0.001 9 -5: dbcsr_work_create 146 6.8 0.000 0.000 0.001 0.001 7 -5: dbcsr_dist_bin 5 3.0 0.001 0.001 0.001 0.001 8 -5: mp_cart_create 1 5.0 0.000 0.001 0.000 0.001 9 -5: dbcsr_distribution_new 36 5.0 0.001 0.001 0.001 0.001 7 -5: dbcsr_make_dbcsr_index 156 8.6 0.001 0.001 0.001 0.001 7 -5: dbcsr_iterator_start 76 6.8 0.000 0.000 0.001 0.001 9 -5: mp_irecv_dv 220 8.5 0.000 0.000 0.000 0.000 9 -5: mp_irecv_iv 260 8.0 0.000 0.000 0.000 0.000 10 -5: dbcsr_make_index_local_row 130 6.0 0.000 0.000 0.000 0.000 10 -5: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 8 -5: dbcsr_iterator_seek 76 7.8 0.000 0.000 0.000 0.000 7 -5: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 7 -5: dbcsr_iterator_stop 76 6.8 0.000 0.000 0.000 0.000 7 -5: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 5 -5: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 7 -5: dbcsr_switch_data_area 43 6.8 0.000 0.000 0.000 0.000 7 -5: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 10 -5: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 7 -5: multiply_cannon_metrocomm3 120 7.0 0.000 0.000 0.000 0.000 7 -5: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 -5: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 7 -5: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 9 -5: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 0 -5: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 3 -5: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 9 -5: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 8 -5: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 8 -5: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 3 -5: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 4 +5: dbcsr_performance_driver 1 1.0 0.000 0.000 10.312 10.332 0 +5: dbcsr_perf_multiply_low 1 2.0 0.007 0.044 10.311 10.332 6 +5: perf_multiply 1 3.0 0.000 0.001 10.172 10.261 0 +5: dbcsr_multiply_generic 10 4.0 0.004 0.004 8.563 8.705 3 +5: multiply_cannon 10 5.0 0.073 0.121 4.212 4.372 3 +5: multiply_cannon_loop 10 6.0 0.347 0.416 3.071 3.226 0 +5: make_m2s 20 5.0 0.002 0.002 2.085 2.659 5 +5: mp_waitall_1 480 8.2 2.389 2.600 2.389 2.600 6 +5: make_images 20 6.0 0.258 0.310 2.035 2.357 5 +5: mp_sum_l 145 2.7 2.226 2.353 2.226 2.353 5 +5: multiply_cannon_metrocomm1 70 7.0 0.002 0.006 1.917 2.153 1 +5: mp_maxloc_dv 205 1.0 1.403 1.510 1.403 1.510 3 +5: mp_sum_d 76 1.3 1.075 1.277 1.075 1.277 6 +5: make_images_sizes 20 7.0 0.000 0.000 0.912 1.117 6 +5: mp_alltoall_i44 20 8.0 0.912 1.117 0.912 1.117 6 +5: mp_allgather_i34 10 6.0 0.820 0.973 0.820 0.973 5 +5: multiply_cannon_multrec 70 7.0 0.797 0.966 0.799 0.967 5 +5: dbcsr_create_new 207 6.7 0.363 0.529 0.532 0.903 3 +5: dbcsr_redistribute 3 4.0 0.369 0.468 0.718 0.819 0 +5: mp_max_l 91 1.0 0.709 0.817 0.709 0.817 6 +5: mp_max_i 94 1.0 0.742 0.792 0.742 0.792 0 +5: make_images_data 20 7.0 0.001 0.001 0.557 0.679 6 +5: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.448 0.588 5 +5: dbcsr_special_finalize 80 7.0 0.026 0.117 0.208 0.560 3 +5: hybrid_alltoall_any 20 8.0 0.079 0.202 0.442 0.531 5 +5: dbcsr_checksum 5 4.0 0.185 0.261 0.465 0.510 4 +5: mp_sync 10 4.0 0.390 0.502 0.390 0.502 1 +5: dbcsr_copy 30 4.7 0.071 0.095 0.318 0.422 3 +5: dbcsr_merge_single_wm 70 8.0 0.103 0.255 0.162 0.413 3 +5: mp_alltoall_i22 3 5.0 0.255 0.393 0.255 0.393 6 +5: dbcsr_make_index_exist 207 7.7 0.168 0.374 0.168 0.374 3 +5: mp_sum_b 20 5.0 0.287 0.331 0.287 0.331 0 +5: dbcsr_make_index_list 80 6.0 0.047 0.300 0.047 0.300 3 +5: dbcsr_finalize 17 4.8 0.006 0.016 0.220 0.299 5 +5: mp_bcast_av 100 1.0 0.001 0.002 0.150 0.298 2 +5: mp_bcast_i 101 2.0 0.149 0.296 0.149 0.296 5 +5: dbcsr_merge_all 13 5.8 0.145 0.224 0.206 0.294 6 +5: setup_buffer_matrices 20 6.0 0.001 0.001 0.045 0.273 3 +5: dbcsr_make_random_matrix 3 3.0 0.078 0.100 0.133 0.264 2 +5: dbcsr_new_transposed 10 5.0 0.020 0.041 0.206 0.264 3 +5: buffer_matrices_ensure_size 20 6.0 0.098 0.217 0.098 0.217 3 +5: setup_rec_index_2d 20 6.0 0.097 0.201 0.097 0.201 3 +5: dbcsr_sort_data 70 9.0 0.056 0.154 0.056 0.154 3 +5: mp_cart_sub 2 5.0 0.072 0.080 0.072 0.080 3 +5: dbcsr_make_untransposed_blocks 20 5.0 0.044 0.072 0.044 0.072 0 +5: make_images_pack 20 7.0 0.039 0.071 0.039 0.072 6 +5: dbcsr_add_wm_from_matrix 10 5.0 0.019 0.062 0.022 0.066 1 +5: dbcsr_sort_indices 106 8.5 0.045 0.059 0.045 0.059 1 +5: mp_sum_lv 2 1.0 0.040 0.052 0.040 0.052 6 +5: dbcsr_init_lib_low 1 1.0 0.024 0.039 0.024 0.039 2 +5: quick_finalize 13 7.5 0.012 0.018 0.023 0.035 5 +5: mp_bcast_iv 2 1.0 0.010 0.032 0.010 0.032 2 +5: merge_index 13 6.8 0.020 0.025 0.020 0.025 6 +5: mp_sum_lm3 1 1.0 0.018 0.024 0.018 0.024 6 +5: dbcsr_data_copy_aa2 13 6.8 0.010 0.022 0.010 0.022 3 +5: mp_max_d 1 1.0 0.011 0.021 0.011 0.021 4 +5: mp_min_rv 1 1.0 0.012 0.020 0.012 0.020 2 +5: mp_sum_r 1 1.0 0.014 0.020 0.014 0.020 6 +5: mp_sum_i 1 1.0 0.013 0.020 0.013 0.020 2 +5: dbcsr_data_release 650 7.0 0.015 0.019 0.015 0.019 0 +5: multiply_cannon_metrocomm2 60 7.0 0.001 0.001 0.008 0.017 6 +5: mp_max_rv 1 1.0 0.013 0.016 0.013 0.016 5 +5: mp_max_r 1 1.0 0.012 0.016 0.012 0.016 2 +5: mp_cart_create 1 5.0 0.011 0.015 0.011 0.015 5 +5: mp_isend_iv 160 8.0 0.004 0.015 0.004 0.015 5 +5: dbcsr_destroy 197 5.4 0.002 0.010 0.008 0.013 3 +5: tree_to_linear_d 3 6.0 0.006 0.012 0.006 0.012 6 +5: mp_sum_rv 1 1.0 0.008 0.012 0.008 0.012 0 +5: transpose_index_local 10 6.0 0.000 0.001 0.009 0.010 5 +5: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.003 0.010 3 +5: dbcsr_mm_csr_init 10 7.0 0.002 0.009 0.003 0.010 4 +5: mp_irecv_dv 120 8.5 0.004 0.009 0.004 0.009 1 +5: dbcsr_make_dbcsr_index 106 8.5 0.002 0.009 0.002 0.009 0 +5: dbcsr_iterator_stop 76 6.8 0.002 0.008 0.002 0.009 2 +5: mp_alltoall_d11v 9 5.0 0.004 0.008 0.004 0.008 5 +5: dbcsr_data_new 431 7.3 0.003 0.007 0.003 0.007 1 +5: dbcsr_work_create 96 6.7 0.001 0.005 0.002 0.005 5 +5: dbcsr_work_destroy_all 96 7.6 0.001 0.002 0.004 0.005 5 +5: mp_sum_root_rm 2 4.0 0.001 0.004 0.001 0.004 0 +5: dbcsr_fill_wm_from_matrix 10 6.0 0.003 0.004 0.003 0.004 6 +5: mp_irecv_iv 160 8.0 0.001 0.002 0.001 0.002 5 +5: dbcsr_iterator_start 76 6.8 0.001 0.001 0.001 0.001 2 +5: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.001 6 +5: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.001 0.001 0.001 3 +5: dbcsr_distribution_new 36 5.0 0.001 0.001 0.001 0.001 6 +5: mp_isend_dv 120 8.5 0.001 0.001 0.001 0.001 3 +5: fill_hash_tables 10 8.0 0.001 0.001 0.001 0.001 3 +5: dbcsr_iterator_seek 76 7.8 0.001 0.001 0.001 0.001 2 +5: dbcsr_dist_bin 5 3.0 0.000 0.000 0.000 0.000 6 +5: dbcsr_make_index_local_row 80 6.0 0.000 0.000 0.000 0.000 2 +5: dbcsr_switch_data_area 43 6.8 0.000 0.000 0.000 0.000 5 +5: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 3 +5: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 5 +5: multiply_cannon_metrocomm3 70 7.0 0.000 0.000 0.000 0.000 6 +5: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 4 +5: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 6 +5: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 3 +5: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 3 5: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 3 -5: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 4 -5: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 9 -5: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 10 -5: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 11 -5: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 1 -5: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 3 -5: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 4 -5: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 11 +5: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 2 +5: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 5 +5: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 2 +5: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 4 5: ------------------------------------------------------------------------------- 5: - 5/19 Test #5: dbcsr_perf:inputs/test_rect2_sparse.perf .............. Passed 0.88 sec + 5/19 Test #5: dbcsr_perf:inputs/test_rect2_sparse.perf .............. Passed 16.59 sec test 6 Start 6: dbcsr_perf:inputs/test_singleblock.perf -6: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_singleblock.perf" +6: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_singleblock.perf" 6: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 6: Environment variables: 6: OMP_NUM_THREADS=2 @@ -2834,12 +2867,12 @@ 6: DBCSR| Use Communication thread T (D) 6: DBCSR| Communication thread load 100 (D) 6: DBCSR| MPI: My process id 0 -6: DBCSR| MPI: Number of processes 12 +6: DBCSR| MPI: Number of processes 7 6: DBCSR| OMP: Current number of threads 2 6: DBCSR| OMP: Max number of threads 2 6: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 6: numthreads 2 -6: numnodes 12 +6: numnodes 7 6: matrix_sizes 50 50 50 6: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 6: trans NN @@ -2856,7 +2889,7 @@ 6: ******************************************************************************** 6: -- PERF dbcsr_multiply (N, N, 3 , N, N, N) 6: matrix sizes A( 50 x 50), B( 50 x 50) and C( 50 x 50) -6: numnodes (nprows X npcols) = 12( 4 X 3) +6: numnodes (nprows X npcols) = 7( 7 X 1) 6: nthreads = 2 6: checksum(A) = 0.836558506590987E+03 6: checksum(B) = 0.818177978508558E+03 @@ -2866,12 +2899,12 @@ 6: 6: 6: mean std minmin maxmax -6: time = 22.58E-03 2.55E-03 15.62E-03 41.62E-03 seconds -6: perf total = 10.91E+06 830.21E+03 6.01E+06 13.77E+06 FLOPS -6: perf per node = 909.28E+03 69.18E+03 500.54E+03 1.15E+06 FLOPS -6: perf per thread = 454.64E+03 34.59E+03 250.27E+03 573.84E+03 FLOPS -6: load imbalance = 0.23E-01 0.24E-02 0.17E-01 0.38E-01 -6: rel load imbal = 0.92E+00 0.70E-03 0.92E+00 0.93E+00 +6: time = 150.57E-03 55.48E-03 36.42E-03 523.46E-03 seconds +6: perf total = 3.12E+06 480.75E+03 477.60E+03 5.65E+06 FLOPS +6: perf per node = 445.63E+03 68.68E+03 68.23E+03 806.63E+03 FLOPS +6: perf per thread = 222.82E+03 34.34E+03 34.11E+03 403.31E+03 FLOPS +6: load imbalance = 0.14E+00 0.49E-01 0.39E-01 0.45E+00 +6: rel load imbal = 0.87E+00 0.15E-02 0.86E+00 0.88E+00 6: ******************************************************************************** 6: 6: ------------------------------------------------------------------------------- @@ -2891,19 +2924,19 @@ 6: marketing flops 2.500000E+06 6: ------------------------------------------------------------------------------- 6: # multiplications 10 -6: max memory usage/rank 99.713024E+06 -6: # max total images/rank 4 +6: max memory usage/rank 72.740864E+06 +6: # max total images/rank 7 6: # max 3D layers 1 -6: # MPI messages exchanged 2040 +6: # MPI messages exchanged 420 6: MPI messages size (bytes): -6: total size 1.000000E+06 +6: total size 1.200000E+06 6: min size 0.000000E+00 6: max size 20.000000E+03 -6: average size 490.196075E+00 +6: average size 2.857143E+03 6: MPI breakdown and total messages size (bytes): -6: size <= 128 1990 0 +6: size <= 128 360 0 6: 128 < size <= 8192 0 0 -6: 8192 < size <= 32768 50 1000000 +6: 8192 < size <= 32768 60 1200000 6: 32768 < size <= 131072 0 0 6: 131072 < size <= 4194304 0 0 6: 4194304 < size <= 16777216 0 0 @@ -2911,7 +2944,7 @@ 6: ------------------------------------------------------------------------------- 6: 6: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -6: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +6: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 6: 6: ------------------------------------------------------------------------------- 6: - - @@ -2920,10 +2953,10 @@ 6: ------------------------------------------------------------------------------- 6: ROUTINE CALLS AVE VOLUME [Bytes] 6: MP_Bcast 2 12. -6: MP_Allreduce 88 33. -6: MP_Alltoall 41 6352. -6: MP_ISend 380 1112. -6: MP_IRecv 380 58. +6: MP_Allreduce 88 24. +6: MP_Alltoall 41 6132. +6: MP_ISend 160 1301. +6: MP_IRecv 160 50. 6: ------------------------------------------------------------------------------- 6: 6: ------------------------------------------------------------------------------- @@ -2933,120 +2966,119 @@ 6: ------------------------------------------------------------------------------- 6: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 6: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -6: dbcsr_performance_driver 1 1.0 0.000 0.000 0.277 0.279 0 -6: dbcsr_perf_multiply_low 1 2.0 0.000 0.002 0.277 0.279 9 -6: perf_multiply 1 3.0 0.000 0.000 0.276 0.279 0 -6: dbcsr_multiply_generic 10 4.0 0.001 0.001 0.226 0.237 11 -6: make_m2s 20 5.0 0.001 0.001 0.092 0.098 2 -6: make_images 20 6.0 0.013 0.029 0.087 0.094 6 -6: multiply_cannon 10 5.0 0.008 0.017 0.075 0.088 7 -6: make_images_sizes 20 7.0 0.000 0.000 0.071 0.086 0 -6: mp_alltoall_i44 20 8.0 0.071 0.086 0.071 0.086 4 -6: multiply_cannon_loop 10 6.0 0.001 0.002 0.039 0.060 3 -6: mp_sum_l 141 2.8 0.044 0.057 0.044 0.057 0 -6: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.043 0.055 7 -6: mp_waitall_1 440 8.3 0.028 0.049 0.028 0.049 10 -6: multiply_cannon_metrocomm1 120 7.0 0.000 0.000 0.016 0.030 7 -6: mp_allgather_i34 10 6.0 0.025 0.030 0.025 0.030 0 -6: mp_sync 10 4.0 0.023 0.028 0.023 0.028 0 -6: dbcsr_create_new 267 6.7 0.013 0.024 0.014 0.025 6 -6: dbcsr_make_dists_dense 10 5.0 0.006 0.022 0.006 0.022 6 -6: multiply_cannon_metrocomm3 120 7.0 0.000 0.000 0.012 0.020 6 -6: multiply_cannon_multrec 120 7.0 0.006 0.018 0.007 0.019 1 -6: dbcsr_redistribute 3 4.0 0.000 0.000 0.014 0.018 0 -6: dbcsr_make_undense 10 5.0 0.000 0.000 0.006 0.018 0 -6: mp_alltoall_i22 3 5.0 0.012 0.017 0.012 0.017 8 -6: mp_sum_d 72 1.3 0.009 0.013 0.009 0.013 9 -6: dbcsr_checksum 5 4.0 0.001 0.005 0.010 0.012 6 -6: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.007 7 -6: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.007 0.001 0.007 3 -6: dbcsr_init_lib_low 1 1.0 0.002 0.007 0.002 0.007 3 -6: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.001 0.004 6 -6: dbcsr_mm_csr_init 10 7.0 0.001 0.004 0.001 0.004 9 -6: mp_max_l 94 1.0 0.003 0.003 0.003 0.003 5 -6: dbcsr_make_images_dense 20 6.0 0.001 0.001 0.002 0.003 7 -6: dbcsr_make_untransposed_blocks 20 5.0 0.000 0.003 0.001 0.003 11 -6: mp_maxloc_dv 211 1.0 0.002 0.003 0.002 0.003 2 -6: dbcsr_make_dense_low 80 6.9 0.001 0.001 0.001 0.002 6 -6: setup_buffer_matrices 20 6.0 0.000 0.000 0.001 0.002 7 -6: dbcsr_copy 10 4.0 0.001 0.002 0.001 0.002 4 -6: dbcsr_make_dense 10 5.0 0.000 0.000 0.001 0.002 2 -6: dbcsr_make_index_exist 267 7.7 0.001 0.002 0.001 0.002 11 -6: make_dense_data 80 7.9 0.000 0.001 0.000 0.001 0 -6: multiply_cannon_metrocomm2 90 7.0 0.000 0.000 0.001 0.001 6 -6: mp_bcast_av 103 1.0 0.000 0.001 0.001 0.001 7 -6: make_images_data 20 7.0 0.000 0.000 0.001 0.001 0 -6: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 0 -6: dbcsr_special_finalize 70 7.0 0.000 0.000 0.001 0.001 6 -6: dbcsr_destroy 257 5.9 0.000 0.000 0.001 0.001 6 -6: mp_irecv_dv 170 8.0 0.001 0.001 0.001 0.001 7 -6: multiply_cannon_metrocomm4 80 7.0 0.000 0.000 0.001 0.001 11 -6: dbcsr_make_random_matrix 3 3.0 0.000 0.000 0.000 0.001 0 -6: dbcsr_finalize 17 4.8 0.000 0.000 0.001 0.001 6 -6: dbcsr_data_release 1070 7.6 0.001 0.001 0.001 0.001 11 -6: mp_bcast_i 104 2.0 0.000 0.001 0.000 0.001 10 -6: dbcsr_data_new 611 7.4 0.000 0.001 0.000 0.001 0 -6: quick_finalize 73 7.9 0.000 0.000 0.000 0.001 0 -6: hybrid_alltoall_any 20 8.0 0.000 0.000 0.000 0.001 0 -6: mp_max_i 97 1.0 0.000 0.000 0.000 0.000 0 -6: dbcsr_iterator_start 116 6.9 0.000 0.000 0.000 0.000 0 -6: dbcsr_merge_all 13 5.8 0.000 0.000 0.000 0.000 7 -6: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.000 0.000 0.000 0 -6: dbcsr_switch_data_area 163 8.2 0.000 0.000 0.000 0.000 2 -6: dbcsr_make_index_list 70 6.0 0.000 0.000 0.000 0.000 3 -6: mp_isend_dv 170 8.0 0.000 0.000 0.000 0.000 9 -6: dbcsr_work_create 86 6.7 0.000 0.000 0.000 0.000 9 -6: dbcsr_iterator_stop 116 6.9 0.000 0.000 0.000 0.000 0 -6: setup_rec_index_2d 20 6.0 0.000 0.000 0.000 0.000 7 -6: mp_isend_iv 210 8.0 0.000 0.000 0.000 0.000 0 -6: dbcsr_work_destroy_all 86 7.6 0.000 0.000 0.000 0.000 2 -6: make_images_pack 20 7.0 0.000 0.000 0.000 0.000 6 -6: buffer_matrices_ensure_size 20 6.0 0.000 0.000 0.000 0.000 1 -6: mp_irecv_iv 210 8.0 0.000 0.000 0.000 0.000 0 -6: dbcsr_fill_wm_from_matrix 10 6.0 0.000 0.000 0.000 0.000 2 -6: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 10 -6: dbcsr_index_prune_deleted 70 7.0 0.000 0.000 0.000 0.000 6 -6: dbcsr_distribution_new 56 5.4 0.000 0.000 0.000 0.000 6 +6: dbcsr_performance_driver 1 1.0 0.000 0.000 2.022 2.037 0 +6: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 2.022 2.036 3 +6: perf_multiply 1 3.0 0.000 0.001 2.021 2.035 0 +6: dbcsr_multiply_generic 10 4.0 0.002 0.002 1.506 1.549 2 +6: multiply_cannon 10 5.0 0.041 0.065 0.566 0.633 4 +6: make_m2s 20 5.0 0.001 0.001 0.440 0.482 2 +6: make_images 20 6.0 0.073 0.097 0.401 0.452 6 +6: multiply_cannon_loop 10 6.0 0.039 0.081 0.323 0.415 0 +6: make_images_sizes 20 7.0 0.000 0.000 0.316 0.396 2 +6: mp_alltoall_i44 20 8.0 0.316 0.396 0.316 0.396 5 +6: mp_sum_l 141 2.8 0.330 0.389 0.330 0.389 4 +6: multiply_cannon_metrocomm1 70 7.0 0.001 0.001 0.218 0.287 0 +6: mp_waitall_1 480 8.2 0.217 0.287 0.217 0.287 1 +6: dbcsr_create_new 297 6.7 0.121 0.182 0.160 0.245 3 +6: dbcsr_redistribute 3 4.0 0.004 0.029 0.198 0.230 0 +6: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.165 0.209 2 +6: mp_sync 10 4.0 0.161 0.207 0.161 0.207 3 +6: mp_allgather_i34 10 6.0 0.142 0.184 0.142 0.184 3 +6: dbcsr_checksum 5 4.0 0.023 0.043 0.098 0.116 4 +6: mp_alltoall_i22 3 5.0 0.077 0.110 0.077 0.110 5 +6: setup_buffer_matrices 20 6.0 0.000 0.000 0.026 0.110 4 +6: multiply_cannon_multrec 70 7.0 0.052 0.091 0.065 0.102 0 +6: mp_sum_d 72 1.3 0.075 0.096 0.075 0.096 0 +6: dbcsr_make_index_exist 297 7.7 0.039 0.090 0.039 0.090 4 +6: mp_cart_sub 2 5.0 0.077 0.084 0.077 0.084 3 +6: mp_sum_b 20 5.0 0.058 0.072 0.058 0.072 0 +6: dbcsr_make_undense 10 5.0 0.000 0.001 0.036 0.071 0 +6: setup_rec_index_2d 20 6.0 0.028 0.061 0.028 0.061 5 +6: dbcsr_make_dists_dense 10 5.0 0.040 0.060 0.040 0.060 4 +6: dbcsr_finalize 17 4.8 0.000 0.000 0.012 0.050 2 +6: dbcsr_merge_all 13 5.8 0.011 0.049 0.011 0.049 4 +6: dbcsr_make_dense 10 5.0 0.000 0.000 0.017 0.049 2 +6: mp_cart_create 1 5.0 0.039 0.046 0.039 0.046 3 +6: dbcsr_init_lib_low 1 1.0 0.021 0.039 0.021 0.039 3 +6: make_images_data 20 7.0 0.001 0.001 0.007 0.038 0 +6: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.014 0.037 2 +6: dbcsr_mm_multrec_finalize 10 9.0 0.014 0.037 0.014 0.037 1 +6: hybrid_alltoall_any 20 8.0 0.006 0.037 0.006 0.037 0 +6: dbcsr_make_images_dense 20 6.0 0.001 0.001 0.011 0.026 0 +6: mp_max_l 93 1.0 0.018 0.023 0.018 0.023 4 +6: dbcsr_make_untransposed_blocks 20 5.0 0.005 0.021 0.005 0.022 4 +6: dbcsr_copy 10 4.0 0.009 0.016 0.009 0.016 4 +6: dbcsr_make_dense_low 90 6.9 0.002 0.002 0.003 0.005 0 +6: mp_bcast_av 102 1.0 0.001 0.001 0.002 0.005 5 +6: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.003 0.005 2 +6: dbcsr_mm_csr_init 10 7.0 0.003 0.005 0.003 0.005 4 +6: mp_max_i 96 1.0 0.002 0.004 0.002 0.004 1 +6: mp_bcast_i 103 2.0 0.001 0.004 0.001 0.004 2 +6: make_dense_data 90 7.9 0.000 0.002 0.001 0.003 0 +6: dbcsr_destroy 287 5.9 0.001 0.001 0.002 0.003 2 +6: dbcsr_data_release 1160 7.6 0.002 0.002 0.002 0.002 2 +6: dbcsr_special_finalize 80 7.0 0.001 0.001 0.002 0.002 0 +6: mp_maxloc_dv 209 1.0 0.002 0.002 0.002 0.002 1 +6: multiply_cannon_metrocomm2 60 7.0 0.001 0.001 0.001 0.002 0 +6: dbcsr_data_new 661 7.4 0.001 0.002 0.001 0.002 2 +6: quick_finalize 83 7.9 0.001 0.001 0.001 0.001 4 +6: dbcsr_make_index_list 80 6.0 0.001 0.001 0.001 0.001 2 +6: dbcsr_iterator_start 116 6.9 0.001 0.001 0.001 0.001 0 +6: dbcsr_make_random_matrix 3 3.0 0.000 0.001 0.001 0.001 0 +6: dbcsr_switch_data_area 183 8.3 0.001 0.001 0.001 0.001 5 +6: dbcsr_iterator_stop 116 6.9 0.000 0.001 0.001 0.001 5 +6: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.000 0.001 0.001 0 +6: dbcsr_work_create 96 6.7 0.000 0.001 0.001 0.001 5 +6: mp_isend_dv 60 8.0 0.000 0.001 0.000 0.001 5 +6: dbcsr_work_destroy_all 96 7.6 0.000 0.000 0.001 0.001 4 +6: make_images_pack 20 7.0 0.000 0.000 0.000 0.000 2 +6: dbcsr_fill_wm_from_matrix 10 6.0 0.000 0.000 0.000 0.000 5 +6: mp_isend_iv 100 8.0 0.000 0.000 0.000 0.000 0 +6: buffer_matrices_ensure_size 20 6.0 0.000 0.000 0.000 0.000 2 +6: dbcsr_index_prune_deleted 80 7.0 0.000 0.000 0.000 0.000 0 6: dbcsr_iterator_seek 116 7.9 0.000 0.000 0.000 0.000 0 -6: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 5 +6: dbcsr_distribution_new 56 5.4 0.000 0.000 0.000 0.000 2 +6: mp_irecv_dv 60 8.0 0.000 0.000 0.000 0.000 2 +6: mp_irecv_iv 100 8.0 0.000 0.000 0.000 0.000 0 +6: dbcsr_make_index_local_row 80 6.0 0.000 0.000 0.000 0.000 3 +6: dbcsr_sort_indices 36 7.4 0.000 0.000 0.000 0.000 0 +6: dbcsr_make_dbcsr_index 96 8.6 0.000 0.000 0.000 0.000 5 +6: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 1 6: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 0 -6: dbcsr_make_index_local_row 70 6.0 0.000 0.000 0.000 0.000 2 +6: dbcsr_get_local_rows 20 5.5 0.000 0.000 0.000 0.000 1 +6: merge_index 13 6.8 0.000 0.000 0.000 0.000 0 +6: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 0 +6: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 0 6: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 +6: multiply_cannon_metrocomm3 70 7.0 0.000 0.000 0.000 0.000 6 6: tree_to_linear_d 3 6.0 0.000 0.000 0.000 0.000 0 -6: dbcsr_sort_indices 36 7.3 0.000 0.000 0.000 0.000 0 -6: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 11 -6: dbcsr_make_dbcsr_index 86 8.6 0.000 0.000 0.000 0.000 6 -6: dbcsr_get_local_rows 20 5.5 0.000 0.000 0.000 0.000 6 -6: merge_index 13 6.8 0.000 0.000 0.000 0.000 0 -6: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 1 +6: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 3 +6: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 4 +6: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 5 6: dbcsr_get_local_cols 20 5.5 0.000 0.000 0.000 0.000 2 -6: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 2 -6: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 0 -6: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 8 -6: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 6 -6: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 4 -6: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 11 +6: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 2 +6: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 0 +6: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 0 +6: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 2 6: dbcsr_data_copy_aa2 3 6.0 0.000 0.000 0.000 0.000 0 -6: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 7 -6: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 10 -6: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 3 -6: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 10 -6: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 4 6: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 0 -6: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 3 -6: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 3 -6: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 11 -6: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 3 -6: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 3 -6: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 4 -6: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 0 +6: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 2 +6: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 2 +6: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 6 +6: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 1 +6: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 2 +6: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 1 +6: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 1 +6: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 1 +6: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 2 +6: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 2 6: ------------------------------------------------------------------------------- 6: - 6/19 Test #6: dbcsr_perf:inputs/test_singleblock.perf ............... Passed 0.34 sec + 6/19 Test #6: dbcsr_perf:inputs/test_singleblock.perf ............... Passed 2.45 sec test 7 Start 7: dbcsr_perf:inputs/test_square_dense.perf -7: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_square_dense.perf" +7: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_square_dense.perf" 7: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 7: Environment variables: 7: OMP_NUM_THREADS=2 @@ -3065,12 +3097,12 @@ 7: DBCSR| Use Communication thread T (D) 7: DBCSR| Communication thread load 100 (D) 7: DBCSR| MPI: My process id 0 -7: DBCSR| MPI: Number of processes 12 +7: DBCSR| MPI: Number of processes 7 7: DBCSR| OMP: Current number of threads 2 7: DBCSR| OMP: Max number of threads 2 7: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 7: numthreads 2 -7: numnodes 12 +7: numnodes 7 7: matrix_sizes 100 100 100 7: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 7: trans NN @@ -3087,7 +3119,7 @@ 7: ******************************************************************************** 7: -- PERF dbcsr_multiply (N, N, 3 , N, N, N) 7: matrix sizes A( 100 x 100), B( 100 x 100) and C( 100 x 100) -7: numnodes (nprows X npcols) = 12( 4 X 3) +7: numnodes (nprows X npcols) = 7( 7 X 1) 7: nthreads = 2 7: checksum(A) = 0.331411242617276E+04 7: checksum(B) = 0.342949174893408E+04 @@ -3097,12 +3129,12 @@ 7: 7: 7: mean std minmin maxmax -7: time = 20.20E-03 2.61E-03 12.31E-03 42.02E-03 seconds -7: perf total = 99.83E+06 9.03E+06 47.59E+06 136.99E+06 FLOPS -7: perf per node = 8.32E+06 752.58E+03 3.97E+06 11.42E+06 FLOPS -7: perf per thread = 4.16E+06 376.29E+03 1.98E+06 5.71E+06 FLOPS -7: load imbalance = 0.21E-01 0.24E-02 0.14E-01 0.39E-01 -7: rel load imbal = 0.93E+00 0.80E-03 0.92E+00 0.93E+00 +7: time = 36.73E-03 4.23E-03 20.56E-03 68.27E-03 seconds +7: perf total = 54.95E+06 6.27E+06 29.30E+06 83.68E+06 FLOPS +7: perf per node = 7.85E+06 895.98E+03 4.19E+06 11.95E+06 FLOPS +7: perf per thread = 3.92E+06 447.99E+03 2.09E+06 5.98E+06 FLOPS +7: load imbalance = 0.36E-01 0.38E-02 0.21E-01 0.59E-01 +7: rel load imbal = 0.87E+00 0.15E-02 0.86E+00 0.88E+00 7: ******************************************************************************** 7: 7: ------------------------------------------------------------------------------- @@ -3111,37 +3143,33 @@ 7: - - 7: ------------------------------------------------------------------------------- 7: COUNTER TOTAL BLAS SMM ACC -7: flops 10 x 30 x 5 480000 100.0% 0.0% 0.0% -7: flops 15 x 30 x 5 720000 100.0% 0.0% 0.0% -7: flops 10 x 35 x 5 1120000 100.0% 0.0% 0.0% -7: flops 15 x 35 x 5 1680000 100.0% 0.0% 0.0% -7: flops 10 x 30 x 10 1920000 100.0% 0.0% 0.0% -7: flops 15 x 30 x 10 2880000 100.0% 0.0% 0.0% -7: flops 10 x 35 x 10 4480000 100.0% 0.0% 0.0% -7: flops 15 x 35 x 10 6720000 100.0% 0.0% 0.0% +7: flops 5 x 100 x 10 800000 100.0% 0.0% 0.0% +7: flops 10 x 100 x 10 1200000 100.0% 0.0% 0.0% +7: flops 5 x 100 x 15 7200000 100.0% 0.0% 0.0% +7: flops 10 x 100 x 15 10800000 100.0% 0.0% 0.0% 7: flops inhomo. stacks 0 0.0% 0.0% 0.0% 7: flops total 20.000000E+06 100.0% 0.0% 0.0% -7: flops max/rank 1.750000E+06 100.0% 0.0% 0.0% +7: flops max/rank 3.000000E+06 100.0% 0.0% 0.0% 7: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% -7: matmuls total 2880 100.0% 0.0% 0.0% -7: number of processed stacks 2880 100.0% 0.0% 0.0% +7: matmuls total 980 100.0% 0.0% 0.0% +7: number of processed stacks 980 100.0% 0.0% 0.0% 7: average stack size 1.0 0.0 0.0 7: marketing flops 20.000000E+06 7: ------------------------------------------------------------------------------- 7: # multiplications 10 -7: max memory usage/rank 99.360768E+06 -7: # max total images/rank 4 +7: max memory usage/rank 72.544256E+06 +7: # max total images/rank 7 7: # max 3D layers 1 -7: # MPI messages exchanged 2040 +7: # MPI messages exchanged 420 7: MPI messages size (bytes): -7: total size 4.000000E+06 -7: min size 1.000000E+03 -7: max size 2.800000E+03 -7: average size 1.960784E+03 +7: total size 4.800000E+06 +7: min size 8.000000E+03 +7: max size 12.000000E+03 +7: average size 11.428571E+03 7: MPI breakdown and total messages size (bytes): 7: size <= 128 0 0 -7: 128 < size <= 8192 2040 4000000 -7: 8192 < size <= 32768 0 0 +7: 128 < size <= 8192 60 480000 +7: 8192 < size <= 32768 360 4320000 7: 32768 < size <= 131072 0 0 7: 131072 < size <= 4194304 0 0 7: 4194304 < size <= 16777216 0 0 @@ -3149,7 +3177,7 @@ 7: ------------------------------------------------------------------------------- 7: 7: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -7: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +7: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 7: 7: ------------------------------------------------------------------------------- 7: - - @@ -3157,11 +3185,11 @@ 7: - - 7: ------------------------------------------------------------------------------- 7: ROUTINE CALLS AVE VOLUME [Bytes] -7: MP_Bcast 9 12. -7: MP_Allreduce 102 32. -7: MP_Alltoall 41 2627. -7: MP_ISend 420 1044. -7: MP_IRecv 420 1020. +7: MP_Bcast 5 12. +7: MP_Allreduce 94 24. +7: MP_Alltoall 41 3929. +7: MP_ISend 160 4600. +7: MP_IRecv 160 4600. 7: ------------------------------------------------------------------------------- 7: 7: ------------------------------------------------------------------------------- @@ -3171,120 +3199,119 @@ 7: ------------------------------------------------------------------------------- 7: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 7: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -7: dbcsr_performance_driver 1 1.0 0.000 0.000 0.265 0.266 0 -7: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 0.264 0.266 0 -7: perf_multiply 1 3.0 0.000 0.000 0.264 0.265 0 -7: dbcsr_multiply_generic 10 4.0 0.001 0.001 0.202 0.208 6 -7: make_m2s 20 5.0 0.001 0.001 0.102 0.114 0 -7: make_images 20 6.0 0.011 0.027 0.095 0.108 10 -7: make_images_sizes 20 7.0 0.000 0.000 0.061 0.079 11 -7: mp_alltoall_i44 20 8.0 0.061 0.079 0.061 0.079 3 -7: multiply_cannon 10 5.0 0.006 0.015 0.065 0.076 0 -7: mp_waitall_1 440 8.3 0.039 0.063 0.039 0.063 7 -7: make_images_data 20 7.0 0.000 0.000 0.021 0.044 5 -7: multiply_cannon_loop 10 6.0 0.001 0.002 0.029 0.038 8 -7: hybrid_alltoall_any 20 8.0 0.001 0.003 0.016 0.038 6 -7: mp_allgather_i34 10 6.0 0.027 0.034 0.027 0.034 2 -7: mp_sum_l 145 2.7 0.023 0.031 0.023 0.031 7 -7: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.023 0.031 0 -7: dbcsr_checksum 5 4.0 0.003 0.020 0.027 0.028 6 -7: mp_sum_d 76 1.3 0.025 0.028 0.025 0.028 10 -7: mp_sync 10 4.0 0.021 0.024 0.021 0.024 2 -7: multiply_cannon_metrocomm3 120 7.0 0.000 0.000 0.009 0.018 11 -7: multiply_cannon_metrocomm1 120 7.0 0.000 0.000 0.010 0.016 6 -7: dbcsr_redistribute 3 4.0 0.002 0.005 0.013 0.016 3 -7: dbcsr_create_new 267 6.7 0.007 0.012 0.008 0.013 0 -7: multiply_cannon_multrec 120 7.0 0.004 0.010 0.006 0.012 8 -7: mp_alltoall_i22 3 5.0 0.010 0.012 0.010 0.012 2 -7: dbcsr_make_dists_dense 10 5.0 0.004 0.011 0.005 0.011 5 -7: dbcsr_make_undense 10 5.0 0.000 0.000 0.004 0.010 11 -7: dbcsr_init_lib_low 1 1.0 0.002 0.007 0.002 0.007 11 -7: dbcsr_make_dense 10 5.0 0.000 0.000 0.001 0.005 5 -7: dbcsr_make_images_dense 20 6.0 0.001 0.001 0.004 0.004 5 -7: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.003 6 -7: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.003 0.001 0.003 11 -7: dbcsr_make_dense_low 80 6.9 0.001 0.001 0.003 0.003 5 -7: mp_max_l 95 1.0 0.002 0.003 0.002 0.003 2 -7: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.001 0.003 6 -7: dbcsr_mm_csr_init 10 7.0 0.001 0.003 0.001 0.003 8 -7: dbcsr_copy 10 4.0 0.000 0.002 0.000 0.002 11 -7: make_dense_data 80 7.9 0.001 0.001 0.002 0.002 3 -7: dbcsr_special_finalize 70 7.0 0.000 0.000 0.001 0.002 5 -7: buffer_matrices_ensure_size 20 6.0 0.000 0.002 0.000 0.002 0 -7: dbcsr_finalize 17 4.8 0.000 0.000 0.001 0.002 0 -7: quick_finalize 73 7.9 0.001 0.001 0.001 0.002 1 -7: multiply_cannon_metrocomm2 90 7.0 0.000 0.001 0.001 0.001 0 -7: dbcsr_merge_all 13 5.8 0.000 0.001 0.001 0.001 5 -7: setup_rec_index_2d 20 6.0 0.000 0.001 0.000 0.001 8 -7: dbcsr_make_index_exist 267 7.7 0.001 0.001 0.001 0.001 5 -7: mp_maxloc_dv 213 1.0 0.001 0.001 0.001 0.001 7 -7: setup_buffer_matrices 20 6.0 0.000 0.000 0.001 0.001 6 -7: dbcsr_iterator_start 166 7.8 0.001 0.001 0.001 0.001 5 -7: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 6 -7: dbcsr_make_random_matrix 3 3.0 0.000 0.001 0.001 0.001 0 -7: dbcsr_destroy 257 5.9 0.000 0.001 0.001 0.001 5 -7: mp_bcast_av 104 1.0 0.000 0.000 0.001 0.001 5 -7: mp_isend_iv 230 8.0 0.000 0.001 0.000 0.001 7 -7: multiply_cannon_metrocomm4 80 7.0 0.000 0.000 0.001 0.001 5 -7: dbcsr_data_release 1170 7.8 0.001 0.001 0.001 0.001 5 -7: mp_irecv_dv 210 8.2 0.001 0.001 0.001 0.001 1 -7: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.000 0.000 0.001 1 -7: dbcsr_data_new 661 7.5 0.001 0.001 0.001 0.001 6 -7: dbcsr_iterator_stop 166 7.8 0.000 0.001 0.000 0.001 0 -7: mp_max_i 105 1.0 0.000 0.001 0.000 0.001 0 -7: mp_bcast_i 105 2.0 0.000 0.000 0.000 0.000 6 -7: dbcsr_fill_wm_from_matrix 10 6.0 0.000 0.000 0.000 0.000 0 -7: make_images_pack 20 7.0 0.000 0.000 0.000 0.000 6 -7: dbcsr_make_index_list 70 6.0 0.000 0.000 0.000 0.000 5 -7: dbcsr_switch_data_area 163 8.2 0.000 0.000 0.000 0.000 5 -7: dbcsr_make_untransposed_blocks 20 5.0 0.000 0.000 0.000 0.000 6 -7: mp_isend_dv 210 8.2 0.000 0.000 0.000 0.000 4 -7: dbcsr_work_create 86 6.7 0.000 0.000 0.000 0.000 10 -7: dbcsr_work_destroy_all 86 7.6 0.000 0.000 0.000 0.000 5 -7: dbcsr_sort_indices 86 8.6 0.000 0.000 0.000 0.000 6 -7: dbcsr_iterator_seek 166 8.8 0.000 0.000 0.000 0.000 10 -7: mp_irecv_iv 230 8.0 0.000 0.000 0.000 0.000 9 -7: dbcsr_index_prune_deleted 70 7.0 0.000 0.000 0.000 0.000 0 +7: dbcsr_performance_driver 1 1.0 0.000 0.000 0.498 0.502 0 +7: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 0.498 0.502 0 +7: perf_multiply 1 3.0 0.000 0.000 0.496 0.500 0 +7: dbcsr_multiply_generic 10 4.0 0.002 0.002 0.367 0.411 0 +7: multiply_cannon 10 5.0 0.015 0.060 0.139 0.152 5 +7: make_m2s 20 5.0 0.001 0.001 0.147 0.151 2 +7: make_images 20 6.0 0.032 0.063 0.133 0.137 5 +7: multiply_cannon_loop 10 6.0 0.002 0.002 0.077 0.127 6 +7: make_images_sizes 20 7.0 0.000 0.000 0.092 0.122 2 +7: mp_alltoall_i44 20 8.0 0.092 0.122 0.092 0.122 2 +7: multiply_cannon_metrocomm1 70 7.0 0.001 0.001 0.053 0.084 1 +7: mp_waitall_1 480 8.2 0.053 0.083 0.053 0.083 2 +7: mp_sum_l 145 2.7 0.044 0.067 0.044 0.067 5 +7: dbcsr_create_new 297 6.7 0.019 0.063 0.022 0.067 5 +7: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.042 0.065 2 +7: multiply_cannon_multrec 70 7.0 0.020 0.063 0.021 0.064 0 +7: mp_sync 10 4.0 0.047 0.063 0.047 0.063 1 +7: dbcsr_make_undense 10 5.0 0.001 0.001 0.016 0.060 3 +7: dbcsr_make_dists_dense 10 5.0 0.016 0.060 0.016 0.060 0 +7: mp_allgather_i34 10 6.0 0.041 0.056 0.041 0.056 5 +7: dbcsr_checksum 5 4.0 0.009 0.023 0.045 0.050 0 +7: mp_sum_d 76 1.3 0.036 0.050 0.036 0.050 2 +7: dbcsr_redistribute 3 4.0 0.011 0.021 0.033 0.038 3 +7: mp_alltoall_i22 3 5.0 0.020 0.029 0.020 0.029 2 +7: dbcsr_copy 10 4.0 0.004 0.012 0.004 0.012 5 +7: dbcsr_make_images_dense 20 6.0 0.001 0.001 0.011 0.012 2 +7: dbcsr_init_lib_low 1 1.0 0.004 0.010 0.004 0.010 5 +7: mp_max_l 94 1.0 0.007 0.009 0.007 0.009 2 +7: dbcsr_make_dense_low 90 6.9 0.002 0.002 0.008 0.009 3 +7: make_dense_data 90 7.9 0.003 0.003 0.006 0.006 3 +7: dbcsr_add_wm_from_matrix 10 5.0 0.001 0.004 0.001 0.004 0 +7: dbcsr_special_finalize 80 7.0 0.001 0.001 0.003 0.003 3 +7: dbcsr_make_index_exist 297 7.7 0.003 0.003 0.003 0.003 6 +7: setup_buffer_matrices 20 6.0 0.000 0.000 0.003 0.003 1 +7: dbcsr_iterator_start 176 7.8 0.002 0.002 0.002 0.003 1 +7: make_images_data 20 7.0 0.001 0.001 0.002 0.002 2 +7: mp_maxloc_dv 211 1.0 0.002 0.002 0.002 0.002 2 +7: multiply_cannon_metrocomm2 60 7.0 0.001 0.001 0.002 0.002 2 +7: dbcsr_destroy 287 5.9 0.001 0.001 0.002 0.002 1 +7: dbcsr_data_release 1280 7.8 0.002 0.002 0.002 0.002 3 +7: quick_finalize 83 7.9 0.001 0.001 0.002 0.002 3 +7: mp_bcast_av 103 1.0 0.001 0.001 0.002 0.002 5 +7: dbcsr_make_dense 10 5.0 0.000 0.000 0.002 0.002 6 +7: dbcsr_finalize 17 4.8 0.000 0.000 0.002 0.002 1 +7: dbcsr_iterator_stop 176 7.8 0.001 0.001 0.002 0.002 2 +7: dbcsr_data_new 721 7.6 0.001 0.002 0.001 0.002 6 +7: dbcsr_make_random_matrix 3 3.0 0.001 0.001 0.001 0.001 4 +7: dbcsr_make_index_list 80 6.0 0.001 0.001 0.001 0.001 6 +7: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 0 +7: mp_isend_dv 60 8.0 0.001 0.001 0.001 0.001 6 +7: mp_max_i 100 1.0 0.001 0.001 0.001 0.001 6 +7: hybrid_alltoall_any 20 8.0 0.001 0.001 0.001 0.001 6 +7: dbcsr_merge_all 13 5.8 0.001 0.001 0.001 0.001 6 +7: dbcsr_switch_data_area 183 8.3 0.001 0.001 0.001 0.001 1 +7: mp_bcast_i 104 2.0 0.001 0.001 0.001 0.001 4 +7: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.001 4 +7: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.001 0.001 0.001 3 +7: setup_rec_index_2d 20 6.0 0.001 0.001 0.001 0.001 1 +7: dbcsr_make_untransposed_blocks 20 5.0 0.000 0.001 0.001 0.001 2 +7: make_images_pack 20 7.0 0.000 0.001 0.001 0.001 4 +7: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.001 0.001 6 +7: buffer_matrices_ensure_size 20 6.0 0.000 0.001 0.000 0.001 5 +7: dbcsr_mm_csr_init 10 7.0 0.001 0.001 0.001 0.001 3 +7: dbcsr_work_create 96 6.7 0.000 0.001 0.001 0.001 1 +7: dbcsr_work_destroy_all 96 7.6 0.000 0.001 0.001 0.001 1 +7: dbcsr_fill_wm_from_matrix 10 6.0 0.000 0.000 0.000 0.001 1 +7: dbcsr_iterator_seek 176 8.8 0.000 0.000 0.000 0.000 6 +7: dbcsr_sort_indices 96 8.6 0.000 0.000 0.000 0.000 6 +7: mp_isend_iv 100 8.0 0.000 0.000 0.000 0.000 6 +7: dbcsr_index_prune_deleted 80 7.0 0.000 0.000 0.000 0.000 6 7: dbcsr_distribution_new 56 5.4 0.000 0.000 0.000 0.000 5 -7: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 3 -7: merge_index 13 6.8 0.000 0.000 0.000 0.000 4 -7: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 9 -7: dbcsr_make_index_local_row 70 6.0 0.000 0.000 0.000 0.000 5 -7: mp_sum_lv 9 1.0 0.000 0.000 0.000 0.000 0 -7: dbcsr_make_dbcsr_index 86 8.6 0.000 0.000 0.000 0.000 8 -7: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 5 -7: tree_to_linear_d 3 6.0 0.000 0.000 0.000 0.000 0 -7: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 8 -7: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 6 -7: dbcsr_get_local_rows 20 5.5 0.000 0.000 0.000 0.000 5 +7: mp_irecv_iv 100 8.0 0.000 0.000 0.000 0.000 1 +7: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 4 +7: dbcsr_make_index_local_row 80 6.0 0.000 0.000 0.000 0.000 6 +7: dbcsr_make_dbcsr_index 96 8.6 0.000 0.000 0.000 0.000 3 +7: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 4 +7: merge_index 13 6.8 0.000 0.000 0.000 0.000 1 +7: mp_irecv_dv 60 8.0 0.000 0.000 0.000 0.000 6 +7: multiply_cannon_metrocomm3 70 7.0 0.000 0.000 0.000 0.000 3 +7: tree_to_linear_d 3 6.0 0.000 0.000 0.000 0.000 6 +7: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 6 7: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 6 -7: dbcsr_data_copy_aa2 13 6.8 0.000 0.000 0.000 0.000 0 -7: mp_bcast_iv 9 1.0 0.000 0.000 0.000 0.000 9 -7: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 11 -7: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 9 +7: dbcsr_data_copy_aa2 13 6.8 0.000 0.000 0.000 0.000 4 +7: mp_sum_lv 5 1.0 0.000 0.000 0.000 0.000 6 +7: dbcsr_get_local_rows 20 5.5 0.000 0.000 0.000 0.000 6 +7: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 1 +7: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 +7: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 6 7: dbcsr_get_local_cols 20 5.5 0.000 0.000 0.000 0.000 5 -7: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 0 -7: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 10 -7: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 6 -7: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 1 -7: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 0 -7: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 7 +7: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 4 +7: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 1 +7: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 6 +7: mp_bcast_iv 5 1.0 0.000 0.000 0.000 0.000 4 +7: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 4 7: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 5 +7: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 6 +7: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 5 +7: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 4 +7: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 6 +7: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 4 7: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 0 -7: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 6 -7: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 1 -7: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 8 -7: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 2 -7: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 11 -7: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 0 -7: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 10 +7: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 6 +7: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 6 +7: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 6 +7: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 4 +7: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 4 7: ------------------------------------------------------------------------------- 7: - 7/19 Test #7: dbcsr_perf:inputs/test_square_dense.perf .............. Passed 0.32 sec + 7/19 Test #7: dbcsr_perf:inputs/test_square_dense.perf .............. Passed 0.59 sec test 8 Start 8: dbcsr_perf:inputs/test_square_sparse.perf -8: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_square_sparse.perf" +8: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_square_sparse.perf" 8: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 8: Environment variables: 8: OMP_NUM_THREADS=2 @@ -3303,12 +3330,12 @@ 8: DBCSR| Use Communication thread T (D) 8: DBCSR| Communication thread load 100 (D) 8: DBCSR| MPI: My process id 0 -8: DBCSR| MPI: Number of processes 12 +8: DBCSR| MPI: Number of processes 7 8: DBCSR| OMP: Current number of threads 2 8: DBCSR| OMP: Max number of threads 2 8: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 8: numthreads 2 -8: numnodes 12 +8: numnodes 7 8: matrix_sizes 1000 1000 1000 8: sparsities 0.90000000000000002 0.90000000000000002 0.90000000000000002 8: trans NN @@ -3325,7 +3352,7 @@ 8: ******************************************************************************** 8: -- PERF dbcsr_multiply (N, N, 3 , N, N, N) 8: matrix sizes A( 1000 x 1000), B( 1000 x 1000) and C( 1000 x 1000) -8: numnodes (nprows X npcols) = 12( 4 X 3) +8: numnodes (nprows X npcols) = 7( 7 X 1) 8: nthreads = 2 8: checksum(A) = 0.330113256255407E+05 8: checksum(B) = 0.336183330312199E+05 @@ -3335,12 +3362,12 @@ 8: 8: 8: mean std minmin maxmax -8: time = 36.43E-03 2.83E-03 26.95E-03 59.83E-03 seconds -8: perf total = 532.11E+06 30.67E+06 331.07E+06 663.79E+06 FLOPS -8: perf per node = 44.34E+06 2.56E+06 27.59E+06 55.32E+06 FLOPS -8: perf per thread = 22.17E+06 1.28E+06 13.79E+06 27.66E+06 FLOPS -8: load imbalance = 0.36E-01 0.25E-02 0.28E-01 0.55E-01 -8: rel load imbal = 0.92E+00 0.55E-03 0.92E+00 0.92E+00 +8: time = 82.59E-03 3.09E-03 67.21E-03 106.79E-03 seconds +8: perf total = 229.66E+06 7.72E+06 185.48E+06 268.70E+06 FLOPS +8: perf per node = 32.81E+06 1.10E+06 26.50E+06 38.39E+06 FLOPS +8: perf per thread = 16.40E+06 551.64E+03 13.25E+06 19.19E+06 FLOPS +8: load imbalance = 0.75E-01 0.25E-02 0.64E-01 0.92E-01 +8: rel load imbal = 0.86E+00 0.95E-03 0.86E+00 0.87E+00 8: ******************************************************************************** 8: 8: ------------------------------------------------------------------------------- @@ -3352,35 +3379,35 @@ 8: flops 5 x 5 x 5 198075000 100.0% 0.0% 0.0% 8: flops inhomo. stacks 0 0.0% 0.0% 0.0% 8: flops total 198.075000E+06 100.0% 0.0% 0.0% -8: flops max/rank 17.092500E+06 100.0% 0.0% 0.0% +8: flops max/rank 28.655000E+06 100.0% 0.0% 0.0% 8: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% 8: matmuls total 792300 100.0% 0.0% 0.0% -8: number of processed stacks 2880 100.0% 0.0% 0.0% -8: average stack size 275.1 0.0 0.0 -8: marketing flops 20.000000E+09 +8: number of processed stacks 1040 100.0% 0.0% 0.0% +8: average stack size 761.8 0.0 0.0 +8: marketing flops 19.999998E+09 8: ------------------------------------------------------------------------------- 8: # multiplications 10 -8: max memory usage/rank 102.805504E+06 -8: # max total images/rank 4 +8: max memory usage/rank 78.557184E+06 +8: # max total images/rank 7 8: # max 3D layers 1 -8: # MPI messages exchanged 2040 +8: # MPI messages exchanged 420 8: MPI messages size (bytes): -8: total size 40.026000E+06 -8: min size 10.800000E+03 -8: max size 27.800000E+03 -8: average size 19.620588E+03 +8: total size 48.516000E+06 +8: min size 112.200000E+03 +8: max size 121.000000E+03 +8: average size 115.514289E+03 8: MPI breakdown and total messages size (bytes): 8: size <= 128 0 0 8: 128 < size <= 8192 0 0 -8: 8192 < size <= 32768 2040 40026000 -8: 32768 < size <= 131072 0 0 +8: 8192 < size <= 32768 0 0 +8: 32768 < size <= 131072 420 48516000 8: 131072 < size <= 4194304 0 0 8: 4194304 < size <= 16777216 0 0 8: 16777216 < size 0 0 8: ------------------------------------------------------------------------------- 8: 8: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -8: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +8: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 8: 8: ------------------------------------------------------------------------------- 8: - - @@ -3389,10 +3416,10 @@ 8: ------------------------------------------------------------------------------- 8: ROUTINE CALLS AVE VOLUME [Bytes] 8: MP_Bcast 2 12. -8: MP_Allreduce 88 33. -8: MP_Alltoall 41 20769. -8: MP_ISend 420 9839. -8: MP_IRecv 420 10264. +8: MP_Allreduce 88 24. +8: MP_Alltoall 41 34895. +8: MP_ISend 160 48998. +8: MP_IRecv 160 48853. 8: ------------------------------------------------------------------------------- 8: 8: ------------------------------------------------------------------------------- @@ -3402,115 +3429,114 @@ 8: ------------------------------------------------------------------------------- 8: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 8: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -8: dbcsr_performance_driver 1 1.0 0.000 0.000 0.444 0.446 0 -8: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 0.443 0.446 0 -8: perf_multiply 1 3.0 0.000 0.000 0.436 0.442 0 -8: dbcsr_multiply_generic 10 4.0 0.001 0.001 0.364 0.369 9 -8: make_m2s 20 5.0 0.001 0.001 0.149 0.164 6 -8: make_images 20 6.0 0.017 0.031 0.147 0.162 3 -8: multiply_cannon 10 5.0 0.005 0.011 0.130 0.151 5 -8: make_images_sizes 20 7.0 0.000 0.000 0.095 0.113 2 -8: mp_alltoall_i44 20 8.0 0.095 0.113 0.095 0.113 7 -8: multiply_cannon_loop 10 6.0 0.002 0.004 0.079 0.093 8 -8: mp_sum_l 145 2.7 0.054 0.079 0.054 0.079 7 -8: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.054 0.078 9 -8: mp_waitall_1 440 8.3 0.043 0.075 0.043 0.075 8 -8: multiply_cannon_multrec 120 7.0 0.050 0.067 0.051 0.067 5 -8: mp_allgather_i34 10 6.0 0.040 0.054 0.040 0.054 11 -8: make_images_data 20 7.0 0.000 0.000 0.023 0.047 3 -8: hybrid_alltoall_any 20 8.0 0.001 0.010 0.019 0.041 6 -8: dbcsr_special_finalize 70 7.0 0.001 0.005 0.009 0.035 2 -8: dbcsr_add_wm_from_matrix 10 5.0 0.003 0.029 0.004 0.030 5 -8: dbcsr_redistribute 3 4.0 0.007 0.010 0.024 0.029 0 -8: dbcsr_merge_single_wm 70 8.0 0.005 0.023 0.007 0.029 2 -8: mp_sync 10 4.0 0.023 0.028 0.023 0.028 10 -8: multiply_cannon_metrocomm1 120 7.0 0.000 0.000 0.013 0.027 9 -8: dbcsr_checksum 5 4.0 0.007 0.009 0.023 0.025 10 -8: dbcsr_create_new 177 6.7 0.012 0.024 0.014 0.025 3 -8: multiply_cannon_metrocomm3 120 7.0 0.000 0.000 0.009 0.024 6 -8: dbcsr_copy 30 4.7 0.002 0.005 0.014 0.024 0 -8: mp_alltoall_i22 3 5.0 0.016 0.023 0.016 0.023 5 -8: mp_sum_d 76 1.3 0.016 0.020 0.016 0.020 5 -8: dbcsr_finalize 17 4.8 0.000 0.000 0.009 0.012 6 -8: dbcsr_merge_all 13 5.8 0.002 0.005 0.008 0.011 3 -8: dbcsr_make_random_matrix 3 3.0 0.005 0.006 0.007 0.010 4 -8: dbcsr_make_untransposed_blocks 20 5.0 0.006 0.009 0.006 0.009 4 -8: dbcsr_init_lib_low 1 1.0 0.003 0.008 0.003 0.008 4 -8: setup_rec_index_2d 20 6.0 0.003 0.007 0.003 0.007 3 -8: dbcsr_sort_data 70 9.0 0.001 0.005 0.001 0.005 2 -8: dbcsr_sort_indices 86 8.6 0.004 0.004 0.004 0.004 8 -8: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.002 0.004 3 -8: dbcsr_mm_csr_init 10 7.0 0.001 0.004 0.002 0.004 3 -8: dbcsr_make_index_exist 177 7.7 0.001 0.004 0.001 0.004 6 -8: mp_max_l 90 1.0 0.003 0.003 0.003 0.003 11 -8: multiply_cannon_metrocomm2 90 7.0 0.000 0.001 0.002 0.003 9 -8: mp_isend_dv 210 8.2 0.002 0.002 0.002 0.002 8 -8: dbcsr_data_release 580 7.0 0.002 0.002 0.002 0.002 1 -8: make_images_pack 20 7.0 0.002 0.002 0.002 0.002 10 -8: multiply_cannon_metrocomm4 80 7.0 0.000 0.000 0.001 0.002 2 -8: setup_buffer_matrices 20 6.0 0.000 0.000 0.001 0.002 2 -8: dbcsr_work_destroy_all 86 7.6 0.000 0.000 0.001 0.002 6 -8: dbcsr_fill_wm_from_matrix 10 6.0 0.001 0.001 0.001 0.002 5 -8: merge_index 13 6.8 0.001 0.001 0.001 0.001 10 -8: mp_maxloc_dv 203 1.0 0.001 0.001 0.001 0.001 1 -8: mp_isend_iv 230 8.0 0.001 0.001 0.001 0.001 4 -8: dbcsr_data_copy_aa2 13 6.8 0.001 0.001 0.001 0.001 1 -8: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 6 -8: mp_bcast_av 99 1.0 0.000 0.000 0.001 0.001 9 -8: mp_irecv_dv 210 8.2 0.001 0.001 0.001 0.001 1 -8: dbcsr_make_index_list 70 6.0 0.001 0.001 0.001 0.001 6 -8: dbcsr_destroy 167 5.4 0.000 0.000 0.001 0.001 8 -8: mp_irecv_iv 230 8.0 0.000 0.001 0.000 0.001 5 -8: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.001 11 +8: dbcsr_performance_driver 1 1.0 0.000 0.000 1.029 1.031 0 +8: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 1.029 1.030 0 +8: perf_multiply 1 3.0 0.000 0.000 1.008 1.019 0 +8: dbcsr_multiply_generic 10 4.0 0.002 0.002 0.826 0.852 2 +8: multiply_cannon 10 5.0 0.012 0.031 0.453 0.519 6 +8: multiply_cannon_loop 10 6.0 0.008 0.046 0.363 0.409 3 +8: multiply_cannon_metrocomm1 70 7.0 0.001 0.001 0.228 0.273 3 +8: mp_waitall_1 480 8.2 0.227 0.273 0.227 0.273 2 +8: mp_sum_l 145 2.7 0.151 0.219 0.151 0.219 6 +8: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.124 0.192 6 +8: multiply_cannon_multrec 70 7.0 0.124 0.182 0.125 0.183 3 +8: make_m2s 20 5.0 0.001 0.001 0.156 0.161 4 +8: make_images 20 6.0 0.025 0.034 0.153 0.158 1 +8: make_images_sizes 20 7.0 0.000 0.000 0.110 0.130 6 +8: mp_alltoall_i44 20 8.0 0.110 0.130 0.110 0.130 3 +8: mp_allgather_i34 10 6.0 0.065 0.094 0.065 0.094 3 +8: dbcsr_redistribute 3 4.0 0.021 0.036 0.064 0.073 2 +8: dbcsr_finalize 17 4.8 0.000 0.000 0.031 0.071 4 +8: dbcsr_merge_all 13 5.8 0.010 0.030 0.027 0.068 3 +8: dbcsr_checksum 5 4.0 0.023 0.033 0.062 0.065 3 +8: dbcsr_create_new 197 6.7 0.025 0.061 0.028 0.064 6 +8: mp_sync 10 4.0 0.052 0.064 0.052 0.064 0 +8: dbcsr_copy 30 4.7 0.006 0.010 0.027 0.062 1 +8: mp_alltoall_i22 3 5.0 0.040 0.055 0.040 0.055 6 +8: mp_sum_d 76 1.3 0.039 0.048 0.039 0.048 0 +8: dbcsr_make_random_matrix 3 3.0 0.009 0.010 0.021 0.042 0 +8: dbcsr_make_untransposed_blocks 20 5.0 0.014 0.022 0.015 0.022 4 +8: merge_index 13 6.8 0.004 0.011 0.004 0.011 3 +8: dbcsr_data_copy_aa2 13 6.8 0.004 0.010 0.004 0.010 3 +8: dbcsr_sort_indices 96 8.6 0.008 0.009 0.008 0.009 3 +8: tree_to_linear_d 3 6.0 0.002 0.009 0.002 0.009 3 +8: setup_rec_index_2d 20 6.0 0.006 0.009 0.006 0.009 6 +8: dbcsr_init_lib_low 1 1.0 0.002 0.008 0.002 0.008 3 +8: dbcsr_special_finalize 80 7.0 0.001 0.001 0.007 0.008 3 +8: mp_max_l 89 1.0 0.005 0.006 0.005 0.006 0 +8: make_images_pack 20 7.0 0.004 0.005 0.004 0.005 4 +8: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.002 0.005 2 +8: dbcsr_data_release 630 7.1 0.004 0.005 0.004 0.005 6 +8: dbcsr_mm_csr_init 10 7.0 0.001 0.004 0.002 0.005 6 +8: dbcsr_merge_single_wm 70 8.0 0.002 0.002 0.004 0.005 3 +8: dbcsr_work_destroy_all 96 7.6 0.001 0.002 0.003 0.005 1 +8: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.000 0.004 0.005 2 +8: dbcsr_fill_wm_from_matrix 10 6.0 0.003 0.004 0.003 0.004 4 +8: make_images_data 20 7.0 0.001 0.001 0.003 0.004 2 +8: setup_buffer_matrices 20 6.0 0.000 0.000 0.003 0.003 3 +8: dbcsr_destroy 187 5.4 0.001 0.001 0.002 0.003 4 +8: dbcsr_make_index_list 80 6.0 0.002 0.002 0.002 0.002 4 +8: hybrid_alltoall_any 20 8.0 0.002 0.002 0.002 0.002 2 +8: mp_max_i 92 1.0 0.002 0.002 0.002 0.002 0 +8: dbcsr_make_index_exist 197 7.7 0.002 0.002 0.002 0.002 3 +8: multiply_cannon_metrocomm2 60 7.0 0.001 0.001 0.002 0.002 3 +8: mp_maxloc_dv 201 1.0 0.002 0.002 0.002 0.002 0 +8: buffer_matrices_ensure_size 20 6.0 0.001 0.002 0.001 0.002 3 +8: dbcsr_sort_data 70 9.0 0.001 0.002 0.001 0.002 4 +8: quick_finalize 13 7.5 0.000 0.000 0.001 0.002 4 +8: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 0 +8: mp_bcast_av 98 1.0 0.001 0.001 0.001 0.001 4 +8: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.001 4 8: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.001 0.001 0.001 5 -8: buffer_matrices_ensure_size 20 6.0 0.001 0.001 0.001 0.001 1 -8: fill_hash_tables 10 8.0 0.000 0.001 0.000 0.001 1 -8: tree_to_linear_d 3 6.0 0.000 0.001 0.000 0.001 9 -8: mp_bcast_i 100 2.0 0.000 0.001 0.000 0.001 5 -8: dbcsr_data_new 391 7.2 0.000 0.000 0.000 0.000 0 -8: mp_max_i 93 1.0 0.000 0.000 0.000 0.000 11 -8: dbcsr_iterator_start 76 6.8 0.000 0.000 0.000 0.000 2 -8: dbcsr_work_create 86 6.7 0.000 0.000 0.000 0.000 9 -8: dbcsr_make_index_local_row 70 6.0 0.000 0.000 0.000 0.000 6 -8: dbcsr_make_dbcsr_index 86 8.6 0.000 0.000 0.000 0.000 6 -8: dbcsr_iterator_seek 76 7.8 0.000 0.000 0.000 0.000 6 -8: dbcsr_distribution_new 26 4.7 0.000 0.000 0.000 0.000 9 -8: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 8 -8: dbcsr_iterator_stop 76 6.8 0.000 0.000 0.000 0.000 3 -8: quick_finalize 3 6.0 0.000 0.000 0.000 0.000 4 -8: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 11 -8: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 7 -8: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 11 -8: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 9 -8: dbcsr_switch_data_area 23 6.1 0.000 0.000 0.000 0.000 6 -8: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 8 -8: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 7 +8: dbcsr_data_new 421 7.3 0.001 0.001 0.001 0.001 0 +8: dbcsr_work_create 96 6.7 0.001 0.001 0.001 0.001 3 +8: fill_hash_tables 10 8.0 0.001 0.001 0.001 0.001 3 +8: dbcsr_iterator_start 76 6.8 0.000 0.000 0.001 0.001 4 +8: mp_bcast_i 99 2.0 0.001 0.001 0.001 0.001 5 +8: mp_isend_iv 100 8.0 0.001 0.001 0.001 0.001 3 +8: dbcsr_make_dbcsr_index 96 8.6 0.000 0.000 0.000 0.000 4 +8: mp_irecv_iv 100 8.0 0.000 0.000 0.000 0.000 4 +8: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 4 +8: dbcsr_distribution_new 26 4.7 0.000 0.000 0.000 0.000 2 +8: dbcsr_iterator_stop 76 6.8 0.000 0.000 0.000 0.000 0 +8: dbcsr_make_index_local_row 80 6.0 0.000 0.000 0.000 0.000 3 +8: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 1 +8: mp_irecv_dv 60 8.0 0.000 0.000 0.000 0.000 6 +8: dbcsr_iterator_seek 76 7.8 0.000 0.000 0.000 0.000 4 +8: mp_isend_dv 60 8.0 0.000 0.000 0.000 0.000 3 +8: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 6 +8: dbcsr_switch_data_area 33 7.0 0.000 0.000 0.000 0.000 4 +8: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 0 +8: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 5 +8: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 6 +8: multiply_cannon_metrocomm3 70 7.0 0.000 0.000 0.000 0.000 3 +8: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 8: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 0 -8: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 0 -8: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 11 +8: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 6 8: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 4 -8: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 0 -8: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 6 -8: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 9 -8: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 7 -8: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 2 +8: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 3 +8: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 0 +8: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 3 +8: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 4 +8: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 0 8: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 0 -8: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 10 -8: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 10 -8: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 4 -8: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 11 -8: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 1 -8: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 7 -8: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 11 -8: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 1 -8: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 1 +8: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 1 +8: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 3 +8: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 5 +8: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 0 +8: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 5 +8: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 0 +8: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 0 +8: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 0 +8: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 0 +8: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 0 8: ------------------------------------------------------------------------------- 8: - 8/19 Test #8: dbcsr_perf:inputs/test_square_sparse.perf ............. Passed 0.50 sec + 8/19 Test #8: dbcsr_perf:inputs/test_square_sparse.perf ............. Passed 1.11 sec test 9 Start 9: dbcsr_perf:inputs/test_square_sparse_bigblocks.perf -9: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_square_sparse_bigblocks.perf" +9: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_square_sparse_bigblocks.perf" 9: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 9: Environment variables: 9: OMP_NUM_THREADS=2 @@ -3529,12 +3555,12 @@ 9: DBCSR| Use Communication thread T (D) 9: DBCSR| Communication thread load 100 (D) 9: DBCSR| MPI: My process id 0 -9: DBCSR| MPI: Number of processes 12 +9: DBCSR| MPI: Number of processes 7 9: DBCSR| OMP: Current number of threads 2 9: DBCSR| OMP: Max number of threads 2 9: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 9: numthreads 2 -9: numnodes 12 +9: numnodes 7 9: matrix_sizes 10000 1000 1000 9: sparsities 0.90000000000000002 0.90000000000000002 0.90000000000000002 9: trans NN @@ -3551,22 +3577,22 @@ 9: ******************************************************************************** 9: -- PERF dbcsr_multiply (N, N, 3 , N, N, N) 9: matrix sizes A( 10000 x 1000), B( 1000 x 1000) and C( 10000 x 1000) -9: numnodes (nprows X npcols) = 12( 4 X 3) +9: numnodes (nprows X npcols) = 7( 7 X 1) 9: nthreads = 2 9: checksum(A) = 0.314680921010826E+06 9: checksum(B) = 0.359513700691199E+05 -9: checksum(C_in) = 0.330421884044952E+06 +9: checksum(C_in) = 0.330421884044953E+06 9: checksum(C_out) = 0.179511893085946E+09 9: checksum(C_out) POS = 0.349170005426525E+09 9: 9: 9: mean std minmin maxmax -9: time = 56.07E-03 1.66E-03 47.52E-03 75.53E-03 seconds -9: perf total = 3.33E+09 111.63E+06 2.60E+09 3.88E+09 FLOPS -9: perf per node = 277.87E+06 9.30E+06 216.26E+06 323.19E+06 FLOPS -9: perf per thread = 138.93E+06 4.65E+06 108.13E+06 161.59E+06 FLOPS -9: load imbalance = 0.55E-01 0.20E-02 0.47E-01 0.70E-01 -9: rel load imbal = 0.92E+00 0.68E-03 0.92E+00 0.93E+00 +9: time = 121.06E-03 4.94E-03 100.93E-03 162.32E-03 seconds +9: perf total = 1.60E+09 58.55E+06 1.21E+09 1.83E+09 FLOPS +9: perf per node = 228.10E+06 8.36E+06 172.50E+06 261.92E+06 FLOPS +9: perf per thread = 114.05E+06 4.18E+06 86.25E+06 130.96E+06 FLOPS +9: load imbalance = 0.11E+00 0.43E-02 0.92E-01 0.14E+00 +9: rel load imbal = 0.86E+00 0.60E-03 0.86E+00 0.86E+00 9: ******************************************************************************** 9: 9: ------------------------------------------------------------------------------- @@ -3578,35 +3604,35 @@ 9: flops 100 x 50 x 20 1960000000 100.0% 0.0% 0.0% 9: flops inhomo. stacks 0 0.0% 0.0% 0.0% 9: flops total 1.960000E+09 100.0% 0.0% 0.0% -9: flops max/rank 218.000000E+06 100.0% 0.0% 0.0% +9: flops max/rank 356.000000E+06 100.0% 0.0% 0.0% 9: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% 9: matmuls total 9800 100.0% 0.0% 0.0% -9: number of processed stacks 2490 100.0% 0.0% 0.0% -9: average stack size 3.9 0.0 0.0 -9: marketing flops 199.999996E+09 +9: number of processed stacks 970 100.0% 0.0% 0.0% +9: average stack size 10.1 0.0 0.0 +9: marketing flops 199.999980E+09 9: ------------------------------------------------------------------------------- 9: # multiplications 10 -9: max memory usage/rank 115.658752E+06 -9: # max total images/rank 4 +9: max memory usage/rank 95.223808E+06 +9: # max total images/rank 7 9: # max 3D layers 1 -9: # MPI messages exchanged 2040 +9: # MPI messages exchanged 420 9: MPI messages size (bytes): -9: total size 176.960000E+06 -9: min size 8.000000E+03 -9: max size 320.000000E+03 -9: average size 86.745102E+03 +9: total size 51.840000E+06 +9: min size 72.000000E+03 +9: max size 160.000000E+03 +9: average size 123.428570E+03 9: MPI breakdown and total messages size (bytes): 9: size <= 128 0 0 -9: 128 < size <= 8192 270 2160000 -9: 8192 < size <= 32768 570 13440000 -9: 32768 < size <= 131072 660 51280000 -9: 131072 < size <= 4194304 540 110080000 +9: 128 < size <= 8192 0 0 +9: 8192 < size <= 32768 0 0 +9: 32768 < size <= 131072 240 24480000 +9: 131072 < size <= 4194304 180 27360000 9: 4194304 < size <= 16777216 0 0 9: 16777216 < size 0 0 9: ------------------------------------------------------------------------------- 9: 9: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -9: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +9: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 9: 9: ------------------------------------------------------------------------------- 9: - - @@ -3615,10 +3641,10 @@ 9: ------------------------------------------------------------------------------- 9: ROUTINE CALLS AVE VOLUME [Bytes] 9: MP_Bcast 2 12. -9: MP_Allreduce 88 33. -9: MP_Alltoall 41 150412. -9: MP_ISend 420 48511. -9: MP_IRecv 420 43744. +9: MP_Allreduce 88 24. +9: MP_Alltoall 41 210309. +9: MP_ISend 160 44311. +9: MP_IRecv 160 46314. 9: ------------------------------------------------------------------------------- 9: 9: ------------------------------------------------------------------------------- @@ -3628,115 +3654,114 @@ 9: ------------------------------------------------------------------------------- 9: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 9: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -9: dbcsr_performance_driver 1 1.0 0.000 0.000 0.679 0.680 0 -9: dbcsr_perf_multiply_low 1 2.0 0.000 0.000 0.679 0.680 0 -9: perf_multiply 1 3.0 0.000 0.000 0.666 0.671 0 -9: dbcsr_multiply_generic 10 4.0 0.001 0.001 0.561 0.581 9 -9: multiply_cannon 10 5.0 0.008 0.015 0.282 0.321 7 -9: multiply_cannon_loop 10 6.0 0.008 0.022 0.224 0.279 1 -9: multiply_cannon_multrec 120 7.0 0.179 0.221 0.180 0.222 10 -9: make_m2s 20 5.0 0.000 0.001 0.141 0.164 4 -9: mp_sum_l 145 2.7 0.103 0.164 0.103 0.164 5 -9: make_images 20 6.0 0.017 0.027 0.140 0.163 0 -9: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.101 0.161 4 -9: mp_waitall_1 440 8.3 0.065 0.110 0.065 0.110 2 -9: make_images_sizes 20 7.0 0.000 0.000 0.069 0.094 7 -9: mp_alltoall_i44 20 8.0 0.069 0.094 0.069 0.094 3 -9: mp_allgather_i34 10 6.0 0.043 0.060 0.043 0.060 3 -9: multiply_cannon_metrocomm3 120 7.0 0.000 0.000 0.024 0.057 11 -9: make_images_data 20 7.0 0.000 0.000 0.037 0.056 11 -9: hybrid_alltoall_any 20 8.0 0.003 0.010 0.031 0.053 9 -9: mp_sync 10 4.0 0.034 0.040 0.034 0.040 6 -9: dbcsr_copy 30 4.7 0.006 0.010 0.020 0.040 9 -9: dbcsr_redistribute 3 4.0 0.006 0.021 0.034 0.038 10 -9: dbcsr_create_new 177 6.7 0.014 0.026 0.016 0.034 1 -9: dbcsr_checksum 5 4.0 0.015 0.022 0.031 0.033 10 -9: mp_alltoall_i22 3 5.0 0.024 0.031 0.024 0.031 5 -9: mp_sum_d 76 1.3 0.017 0.022 0.017 0.022 5 -9: dbcsr_finalize 17 4.8 0.000 0.000 0.015 0.021 4 -9: dbcsr_make_random_matrix 3 3.0 0.007 0.009 0.013 0.020 1 -9: multiply_cannon_metrocomm1 120 7.0 0.000 0.000 0.008 0.018 1 -9: dbcsr_merge_all 13 5.8 0.004 0.012 0.011 0.017 2 -9: dbcsr_special_finalize 70 7.0 0.000 0.001 0.010 0.014 11 -9: dbcsr_merge_single_wm 70 8.0 0.005 0.010 0.009 0.014 4 -9: dbcsr_data_release 580 7.0 0.010 0.012 0.010 0.012 11 -9: buffer_matrices_ensure_size 20 6.0 0.003 0.008 0.003 0.008 7 -9: dbcsr_data_copy_aa2 13 6.8 0.005 0.008 0.005 0.008 9 -9: make_images_pack 20 7.0 0.005 0.007 0.005 0.007 7 -9: dbcsr_make_index_exist 177 7.7 0.001 0.007 0.001 0.007 1 -9: dbcsr_add_wm_from_matrix 10 5.0 0.001 0.005 0.005 0.007 10 -9: dbcsr_fill_wm_from_matrix 10 6.0 0.003 0.007 0.003 0.007 6 -9: dbcsr_destroy 167 5.4 0.000 0.000 0.005 0.006 4 -9: dbcsr_sort_data 70 9.0 0.004 0.005 0.004 0.005 9 -9: dbcsr_work_destroy_all 86 7.6 0.000 0.000 0.004 0.005 4 -9: mp_max_l 90 1.0 0.003 0.003 0.003 0.003 7 -9: multiply_cannon_metrocomm2 90 7.0 0.001 0.001 0.003 0.003 4 -9: dbcsr_init_lib_low 1 1.0 0.001 0.003 0.001 0.003 0 -9: tree_to_linear_d 3 6.0 0.001 0.002 0.001 0.002 9 -9: mp_isend_dv 210 8.2 0.002 0.002 0.002 0.002 4 -9: mp_maxloc_dv 203 1.0 0.002 0.002 0.002 0.002 5 -9: mp_alltoall_d11v 9 5.0 0.001 0.002 0.001 0.002 9 -9: mp_irecv_dv 210 8.2 0.001 0.002 0.001 0.002 1 -9: setup_buffer_matrices 20 6.0 0.000 0.000 0.001 0.002 4 -9: multiply_cannon_metrocomm4 80 7.0 0.000 0.000 0.001 0.001 7 -9: dbcsr_data_new 391 7.2 0.001 0.001 0.001 0.001 11 -9: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 9 -9: mp_isend_iv 230 8.0 0.001 0.001 0.001 0.001 6 -9: mp_bcast_av 99 1.0 0.000 0.000 0.001 0.001 10 -9: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.001 0.001 10 -9: dbcsr_mm_csr_init 10 7.0 0.001 0.001 0.001 0.001 2 -9: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.000 0.001 4 -9: dbcsr_mm_multrec_finalize 10 9.0 0.000 0.001 0.000 0.001 4 -9: dbcsr_work_create 86 6.7 0.000 0.000 0.001 0.001 10 -9: mp_bcast_i 100 2.0 0.000 0.001 0.000 0.001 2 -9: dbcsr_make_untransposed_blocks 20 5.0 0.000 0.000 0.000 0.001 9 -9: mp_max_i 93 1.0 0.000 0.001 0.000 0.001 0 -9: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 8 -9: dbcsr_make_index_list 70 6.0 0.000 0.000 0.000 0.000 4 -9: setup_rec_index_2d 20 6.0 0.000 0.000 0.000 0.000 7 -9: dbcsr_iterator_start 76 6.8 0.000 0.000 0.000 0.000 4 -9: dbcsr_sort_indices 86 8.6 0.000 0.000 0.000 0.000 6 -9: mp_irecv_iv 230 8.0 0.000 0.000 0.000 0.000 4 -9: dbcsr_iterator_stop 76 6.8 0.000 0.000 0.000 0.000 11 -9: merge_index 13 6.8 0.000 0.000 0.000 0.000 9 -9: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 11 -9: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 3 -9: dbcsr_make_index_local_row 70 6.0 0.000 0.000 0.000 0.000 7 +9: dbcsr_performance_driver 1 1.0 0.000 0.000 1.513 1.521 0 +9: dbcsr_perf_multiply_low 1 2.0 0.005 0.032 1.513 1.521 4 +9: perf_multiply 1 3.0 0.000 0.001 1.483 1.501 0 +9: dbcsr_multiply_generic 10 4.0 0.002 0.002 1.210 1.231 4 +9: multiply_cannon 10 5.0 0.012 0.025 0.801 0.867 5 +9: multiply_cannon_loop 10 6.0 0.023 0.056 0.707 0.768 2 +9: multiply_cannon_multrec 70 7.0 0.427 0.575 0.428 0.575 5 +9: multiply_cannon_metrocomm1 70 7.0 0.001 0.001 0.254 0.430 4 +9: mp_waitall_1 480 8.2 0.254 0.430 0.254 0.430 0 +9: make_m2s 20 5.0 0.001 0.001 0.192 0.210 4 +9: make_images 20 6.0 0.024 0.060 0.186 0.204 5 +9: mp_sum_l 145 2.7 0.118 0.159 0.118 0.159 1 +9: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.113 0.155 0 +9: dbcsr_checksum 5 4.0 0.072 0.098 0.126 0.130 1 +9: make_images_sizes 20 7.0 0.000 0.000 0.102 0.122 2 +9: mp_alltoall_i44 20 8.0 0.102 0.122 0.102 0.122 1 +9: dbcsr_redistribute 3 4.0 0.012 0.018 0.072 0.089 1 +9: dbcsr_finalize 17 4.8 0.000 0.001 0.064 0.086 0 +9: mp_allgather_i34 10 6.0 0.061 0.081 0.061 0.081 3 +9: mp_sum_d 76 1.3 0.055 0.080 0.055 0.080 0 +9: dbcsr_copy 30 4.7 0.019 0.027 0.038 0.074 2 +9: dbcsr_merge_all 13 5.8 0.013 0.035 0.050 0.074 6 +9: mp_alltoall_i22 3 5.0 0.049 0.064 0.049 0.064 3 +9: mp_sync 10 4.0 0.053 0.063 0.053 0.063 1 +9: dbcsr_create_new 197 6.7 0.022 0.053 0.025 0.057 6 +9: dbcsr_data_copy_aa2 13 6.8 0.033 0.047 0.033 0.047 1 +9: dbcsr_data_release 630 7.1 0.027 0.032 0.027 0.032 6 +9: dbcsr_make_random_matrix 3 3.0 0.016 0.019 0.024 0.031 5 +9: dbcsr_special_finalize 80 7.0 0.002 0.009 0.018 0.027 6 +9: dbcsr_add_wm_from_matrix 10 5.0 0.003 0.014 0.015 0.025 0 +9: dbcsr_init_lib_low 1 1.0 0.008 0.024 0.008 0.024 4 +9: make_images_data 20 7.0 0.001 0.001 0.017 0.021 4 +9: hybrid_alltoall_any 20 8.0 0.015 0.020 0.016 0.020 1 +9: make_images_pack 20 7.0 0.016 0.020 0.016 0.020 1 +9: dbcsr_merge_single_wm 70 8.0 0.004 0.007 0.015 0.019 5 +9: mp_max_l 89 1.0 0.014 0.018 0.014 0.018 3 +9: dbcsr_work_destroy_all 96 7.6 0.001 0.001 0.014 0.017 4 +9: mp_alltoall_d11v 9 5.0 0.008 0.017 0.008 0.017 4 +9: buffer_matrices_ensure_size 20 6.0 0.013 0.015 0.013 0.015 2 +9: dbcsr_fill_wm_from_matrix 10 6.0 0.012 0.013 0.012 0.013 5 +9: dbcsr_make_index_list 80 6.0 0.005 0.013 0.005 0.013 2 +9: dbcsr_sort_data 70 9.0 0.010 0.012 0.010 0.012 1 +9: dbcsr_destroy 187 5.4 0.001 0.001 0.009 0.011 0 +9: dbcsr_make_untransposed_blocks 20 5.0 0.002 0.008 0.002 0.008 2 +9: dbcsr_mm_multrec_init 10 6.0 0.000 0.000 0.002 0.007 5 +9: dbcsr_mm_csr_init 10 7.0 0.002 0.007 0.002 0.007 2 +9: mp_max_i 92 1.0 0.002 0.007 0.002 0.007 2 +9: setup_buffer_matrices 20 6.0 0.001 0.001 0.004 0.005 5 +9: tree_to_linear_d 3 6.0 0.003 0.004 0.003 0.004 5 +9: dbcsr_data_new 421 7.3 0.002 0.003 0.002 0.003 5 +9: dbcsr_make_index_exist 197 7.7 0.002 0.002 0.002 0.002 6 +9: multiply_cannon_metrocomm2 60 7.0 0.001 0.001 0.002 0.002 2 +9: setup_rec_index_2d 20 6.0 0.001 0.002 0.001 0.002 5 +9: mp_maxloc_dv 201 1.0 0.002 0.002 0.002 0.002 1 +9: mp_cart_sub 2 5.0 0.002 0.002 0.002 0.002 0 +9: mp_bcast_av 98 1.0 0.001 0.001 0.001 0.002 4 +9: dbcsr_work_create 96 6.7 0.001 0.001 0.001 0.001 4 +9: multiply_cannon_multrec_finali 10 8.0 0.000 0.000 0.001 0.001 0 +9: dbcsr_mm_multrec_finalize 10 9.0 0.001 0.001 0.001 0.001 0 +9: mp_cart_create 1 5.0 0.001 0.001 0.001 0.001 3 +9: mp_bcast_i 99 2.0 0.001 0.001 0.001 0.001 1 +9: dbcsr_iterator_start 76 6.8 0.000 0.001 0.001 0.001 2 +9: dbcsr_sort_indices 96 8.6 0.001 0.001 0.001 0.001 2 +9: quick_finalize 13 7.5 0.000 0.000 0.000 0.001 6 +9: mp_irecv_dv 60 8.0 0.000 0.000 0.000 0.000 4 +9: dbcsr_iterator_stop 76 6.8 0.000 0.000 0.000 0.000 4 +9: mp_isend_iv 100 8.0 0.000 0.000 0.000 0.000 6 +9: mp_isend_dv 60 8.0 0.000 0.000 0.000 0.000 0 +9: mp_irecv_iv 100 8.0 0.000 0.000 0.000 0.000 6 +9: merge_index 13 6.8 0.000 0.000 0.000 0.000 0 +9: dbcsr_make_index_local_row 80 6.0 0.000 0.000 0.000 0.000 4 9: dbcsr_iterator_seek 76 7.8 0.000 0.000 0.000 0.000 2 -9: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 0 -9: dbcsr_make_dbcsr_index 86 8.6 0.000 0.000 0.000 0.000 11 -9: dbcsr_distribution_new 26 4.7 0.000 0.000 0.000 0.000 10 -9: quick_finalize 3 6.0 0.000 0.000 0.000 0.000 2 -9: dbcsr_switch_data_area 23 6.1 0.000 0.000 0.000 0.000 4 -9: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 10 +9: dbcsr_switch_data_area 33 7.0 0.000 0.000 0.000 0.000 1 +9: dbcsr_make_dbcsr_index 96 8.6 0.000 0.000 0.000 0.000 0 +9: mp_sum_b 20 5.0 0.000 0.000 0.000 0.000 6 +9: dbcsr_distribution_new 26 4.7 0.000 0.000 0.000 0.000 4 +9: fill_hash_tables 10 8.0 0.000 0.000 0.000 0.000 5 +9: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 5 +9: multiply_cannon_metrocomm3 70 7.0 0.000 0.000 0.000 0.000 6 9: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 +9: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 2 +9: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 0 9: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 4 -9: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 0 -9: dbcsr_mm_sched_init 10 8.0 0.000 0.000 0.000 0.000 10 -9: dbcsr_get_data_size_used 16 5.8 0.000 0.000 0.000 0.000 4 -9: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 4 -9: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 11 -9: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 10 -9: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 10 -9: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 4 -9: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 2 -9: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 2 -9: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 0 -9: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 9 -9: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 9 +9: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 2 +9: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 0 +9: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 4 +9: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 3 +9: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 5 +9: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 2 +9: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 3 +9: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 0 +9: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 6 +9: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 5 +9: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 3 +9: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 4 +9: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 2 9: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 2 -9: dbcsr_mm_sched_finalize 10 10.0 0.000 0.000 0.000 0.000 3 -9: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 9 -9: dbcsr_mm_hostdrv_init 10 9.0 0.000 0.000 0.000 0.000 10 -9: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 9 -9: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 8 +9: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 1 +9: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 5 +9: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 2 +9: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 2 9: ------------------------------------------------------------------------------- 9: - 9/19 Test #9: dbcsr_perf:inputs/test_square_sparse_bigblocks.perf ... Passed 0.74 sec + 9/19 Test #9: dbcsr_perf:inputs/test_square_sparse_bigblocks.perf ... Passed 1.61 sec test 10 Start 10: dbcsr_perf:inputs/test_square_sparse_rma.perf -10: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_square_sparse_rma.perf" +10: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_perf" "/build/reproducible-path/dbcsr-2.6.0/tests/inputs/test_square_sparse_rma.perf" 10: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 10: Environment variables: 10: OMP_NUM_THREADS=2 @@ -3755,12 +3780,12 @@ 10: DBCSR| Use Communication thread T (D) 10: DBCSR| Communication thread load 100 (D) 10: DBCSR| MPI: My process id 0 -10: DBCSR| MPI: Number of processes 12 +10: DBCSR| MPI: Number of processes 7 10: DBCSR| OMP: Current number of threads 2 10: DBCSR| OMP: Max number of threads 2 10: DBCSR| Split modifier for TAS multiplication algorithm 1.0E+00 (D) 10: numthreads 2 -10: numnodes 12 +10: numnodes 7 10: matrix_sizes 1000 1000 1000 10: sparsities 0.90000000000000002 0.90000000000000002 0.90000000000000002 10: trans NN @@ -3777,7 +3802,7 @@ 10: ******************************************************************************** 10: -- PERF dbcsr_multiply (N, N, 3 , N, N, N) 10: matrix sizes A( 1000 x 1000), B( 1000 x 1000) and C( 1000 x 1000) -10: numnodes (nprows X npcols) = 12( 4 X 3) +10: numnodes (nprows X npcols) = 7( 7 X 1) 10: nthreads = 2 10: checksum(A) = 0.330113256255407E+05 10: checksum(B) = 0.336183330312199E+05 @@ -3787,12 +3812,12 @@ 10: 10: 10: mean std minmin maxmax -10: time = 37.08E-03 2.27E-03 27.71E-03 55.54E-03 seconds -10: perf total = 481.67E+06 28.56E+06 356.62E+06 632.32E+06 FLOPS -10: perf per node = 40.14E+06 2.38E+06 29.72E+06 52.69E+06 FLOPS -10: perf per thread = 20.07E+06 1.19E+06 14.86E+06 26.35E+06 FLOPS -10: load imbalance = 0.39E-01 0.22E-02 0.29E-01 0.51E-01 -10: rel load imbal = 0.93E+00 0.25E-02 0.92E+00 0.95E+00 +10: time = 63.20E-03 3.51E-03 45.01E-03 88.11E-03 seconds +10: perf total = 305.33E+06 16.55E+06 224.81E+06 382.35E+06 FLOPS +10: perf per node = 43.62E+06 2.36E+06 32.12E+06 54.62E+06 FLOPS +10: perf per thread = 21.81E+06 1.18E+06 16.06E+06 27.31E+06 FLOPS +10: load imbalance = 0.58E-01 0.31E-02 0.45E-01 0.76E-01 +10: rel load imbal = 0.86E+00 0.14E-02 0.86E+00 0.88E+00 10: ******************************************************************************** 10: 10: ------------------------------------------------------------------------------- @@ -3804,35 +3829,35 @@ 10: flops 5 x 5 x 5 198075000 100.0% 0.0% 0.0% 10: flops inhomo. stacks 0 0.0% 0.0% 0.0% 10: flops total 198.075000E+06 100.0% 0.0% 0.0% -10: flops max/rank 17.092500E+06 100.0% 0.0% 0.0% +10: flops max/rank 28.655000E+06 100.0% 0.0% 0.0% 10: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% 10: matmuls total 792300 100.0% 0.0% 0.0% -10: number of processed stacks 2880 100.0% 0.0% 0.0% -10: average stack size 275.1 0.0 0.0 -10: marketing flops 20.000000E+09 +10: number of processed stacks 1040 100.0% 0.0% 0.0% +10: average stack size 761.8 0.0 0.0 +10: marketing flops 19.999998E+09 10: ------------------------------------------------------------------------------- 10: # multiplications 10 -10: max memory usage/rank 104.554496E+06 -10: # max total images/rank 4 +10: max memory usage/rank 80.064512E+06 +10: # max total images/rank 7 10: # max 3D layers 1 -10: # MPI messages exchanged 2880 +10: # MPI messages exchanged 980 10: MPI messages size (bytes): -10: total size 55.996000E+06 -10: min size 10.800000E+03 -10: max size 27.800000E+03 -10: average size 19.443055E+03 +10: total size 64.486000E+06 +10: min size 13.000000E+03 +10: max size 121.000000E+03 +10: average size 65.802039E+03 10: MPI breakdown and total messages size (bytes): 10: size <= 128 0 0 10: 128 < size <= 8192 0 0 -10: 8192 < size <= 32768 2880 55996000 -10: 32768 < size <= 131072 0 0 +10: 8192 < size <= 32768 490 7884000 +10: 32768 < size <= 131072 490 56602000 10: 131072 < size <= 4194304 0 0 10: 4194304 < size <= 16777216 0 0 10: 16777216 < size 0 0 10: ------------------------------------------------------------------------------- 10: 10: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -10: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +10: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 10: 10: ------------------------------------------------------------------------------- 10: - - @@ -3841,11 +3866,9 @@ 10: ------------------------------------------------------------------------------- 10: ROUTINE CALLS AVE VOLUME [Bytes] 10: MP_Bcast 2 12. -10: MP_Allreduce 68 40. -10: MP_Alltoall 41 21097. -10: MP_ISend 40 11554. -10: MP_IRecv 40 11819. -10: MP_RGet 480 10440. +10: MP_Allreduce 68 28. +10: MP_Alltoall 41 35114. +10: MP_RGet 280 34945. 10: ------------------------------------------------------------------------------- 10: 10: ------------------------------------------------------------------------------- @@ -3855,120 +3878,116 @@ 10: ------------------------------------------------------------------------------- 10: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 10: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -10: dbcsr_performance_driver 1 1.0 0.000 0.000 0.501 0.504 0 -10: dbcsr_perf_multiply_low 1 2.0 0.000 0.001 0.501 0.504 7 -10: perf_multiply 1 3.0 0.000 0.000 0.494 0.498 0 -10: dbcsr_multiply_generic 10 4.0 0.001 0.001 0.371 0.390 11 -10: multiply_3D 10 5.0 0.006 0.016 0.154 0.172 6 -10: multiply_3D_loop 10 6.0 0.007 0.015 0.119 0.150 8 -10: make_buffers 20 5.0 0.026 0.038 0.111 0.128 8 -10: mp_sum_l 125 2.4 0.077 0.118 0.077 0.118 4 -10: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.076 0.117 4 -10: mp_waitall_1 490 7.7 0.069 0.090 0.069 0.090 8 -10: make_buffers_sizes 20 6.0 0.000 0.000 0.066 0.075 3 -10: mp_alltoall_i44 20 7.0 0.066 0.075 0.066 0.075 7 -10: mp_sync 10 4.0 0.064 0.074 0.064 0.074 6 -10: multiply_3D_multrec 120 7.0 0.049 0.060 0.049 0.060 11 -10: multiply_3D_comm_right 120 7.0 0.000 0.000 0.036 0.059 3 -10: dbcsr_copy 30 4.7 0.004 0.011 0.023 0.043 3 -10: dbcsr_redistribute 3 4.0 0.008 0.020 0.034 0.040 5 -10: multiply_3D_comm_left 120 7.0 0.000 0.000 0.021 0.037 8 -10: dbcsr_create_new 77 5.7 0.018 0.027 0.019 0.033 3 -10: mp_alltoall_i22 3 5.0 0.025 0.032 0.025 0.032 4 -10: win_setup 20 6.0 0.000 0.000 0.019 0.032 3 -10: win_setup_win_check 18 7.0 0.000 0.000 0.015 0.027 11 -10: mp_wait 18 8.0 0.015 0.027 0.015 0.027 5 -10: dbcsr_checksum 5 4.0 0.007 0.011 0.022 0.024 5 -10: make_buffers_data 20 6.0 0.000 0.000 0.014 0.021 8 -10: hybrid_alltoall_any 20 7.0 0.000 0.000 0.013 0.020 5 -10: mp_sum_d 76 1.3 0.015 0.017 0.015 0.017 11 -10: dbcsr_init_lib_low 1 1.0 0.003 0.011 0.003 0.011 0 -10: dbcsr_make_untransposed_blocks 20 5.0 0.006 0.010 0.006 0.010 3 -10: dbcsr_finalize 17 5.4 0.001 0.003 0.009 0.010 0 -10: mp_rget_iv 240 7.0 0.004 0.010 0.004 0.010 8 -10: dbcsr_merge_all 13 6.5 0.001 0.002 0.007 0.008 3 -10: dbcsr_make_random_matrix 3 3.0 0.005 0.006 0.006 0.007 0 -10: dbcsr_mm_multrec_init 10 7.0 0.000 0.000 0.002 0.006 11 -10: dbcsr_mm_csr_init 10 8.0 0.001 0.006 0.002 0.006 6 -10: mp_max_l 88 1.0 0.005 0.006 0.005 0.006 1 -10: dbcsr_make_index_exist 37 6.4 0.001 0.006 0.001 0.006 3 -10: dbcsr_mm_multrec_finalize 10 6.0 0.001 0.005 0.001 0.005 3 -10: mp_win_create_dv 2 7.0 0.004 0.005 0.004 0.005 0 -10: setup_rec_index_images 20 6.0 0.003 0.004 0.003 0.004 11 -10: dbcsr_sort_indices 16 7.4 0.003 0.003 0.003 0.003 9 -10: make_buffers_pack 20 6.0 0.002 0.002 0.002 0.003 1 -10: mp_rget_dv 240 7.0 0.001 0.002 0.001 0.002 5 -10: dbcsr_data_release 310 6.7 0.001 0.002 0.001 0.002 8 -10: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.000 0.002 0.002 3 -10: dbcsr_work_destroy_all 16 6.4 0.000 0.000 0.001 0.002 6 -10: dbcsr_fill_wm_from_matrix 10 6.0 0.001 0.001 0.001 0.001 10 -10: merge_index 13 7.5 0.001 0.001 0.001 0.001 9 -10: dbcsr_data_copy_aa2 13 7.5 0.001 0.001 0.001 0.001 9 -10: mp_maxloc_dv 199 1.0 0.001 0.001 0.001 0.001 2 -10: mp_bcast_av 97 1.0 0.000 0.000 0.001 0.001 3 -10: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 9 -10: mp_bcast_i 98 2.0 0.000 0.001 0.000 0.001 5 -10: fill_hash_tables 10 9.0 0.000 0.001 0.000 0.001 1 -10: tree_to_linear_d 3 6.0 0.000 0.001 0.000 0.001 9 -10: mp_max_i 91 1.0 0.000 0.001 0.000 0.001 4 -10: dbcsr_destroy 67 5.4 0.000 0.000 0.000 0.000 3 -10: dbcsr_iterator_start 76 6.3 0.000 0.000 0.000 0.000 2 -10: dbcsr_data_new 179 6.1 0.000 0.000 0.000 0.000 5 -10: mp_isend_dv 20 8.0 0.000 0.000 0.000 0.000 10 -10: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 9 -10: mp_win_create_iv 2 7.0 0.000 0.000 0.000 0.000 4 -10: dbcsr_work_create 16 5.4 0.000 0.000 0.000 0.000 7 -10: dbcsr_iterator_seek 76 7.3 0.000 0.000 0.000 0.000 3 -10: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 6 -10: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 7 -10: mp_iallgather_i24 20 6.0 0.000 0.000 0.000 0.000 3 -10: dbcsr_distribution_new 26 4.7 0.000 0.000 0.000 0.000 7 -10: dbcsr_iterator_stop 76 6.3 0.000 0.000 0.000 0.000 10 -10: quick_finalize 3 6.0 0.000 0.000 0.000 0.000 7 -10: mp_isum_bv 18 6.0 0.000 0.000 0.000 0.000 8 -10: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 0 -10: mp_isend_iv 20 7.0 0.000 0.000 0.000 0.000 3 -10: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 10 -10: dbcsr_make_dbcsr_index 16 7.4 0.000 0.000 0.000 0.000 7 -10: dbcsr_switch_data_area 23 6.1 0.000 0.000 0.000 0.000 7 +10: dbcsr_performance_driver 1 1.0 0.000 0.000 0.798 0.799 0 +10: dbcsr_perf_multiply_low 1 2.0 0.000 0.001 0.797 0.799 3 +10: perf_multiply 1 3.0 0.000 0.000 0.781 0.787 0 +10: dbcsr_multiply_generic 10 4.0 0.002 0.002 0.632 0.646 1 +10: multiply_3D 10 5.0 0.003 0.003 0.318 0.380 2 +10: multiply_3D_loop 10 6.0 0.008 0.038 0.226 0.292 2 +10: mp_sum_l 125 2.4 0.157 0.198 0.157 0.198 4 +10: multiply_3D_multrec 70 7.0 0.110 0.171 0.110 0.171 1 +10: dbcsr_multiply_generic_mpsum_f 10 5.0 0.000 0.000 0.119 0.155 4 +10: mp_waitall_1 390 7.7 0.100 0.132 0.100 0.132 0 +10: multiply_3D_comm_right 70 7.0 0.000 0.000 0.100 0.132 5 +10: make_buffers 20 5.0 0.012 0.044 0.119 0.124 2 +10: make_buffers_sizes 20 6.0 0.000 0.000 0.082 0.093 1 +10: mp_alltoall_i44 20 7.0 0.082 0.093 0.082 0.093 4 +10: mp_sync 10 4.0 0.058 0.092 0.058 0.092 1 +10: win_setup 20 6.0 0.000 0.000 0.066 0.085 1 +10: dbcsr_copy 30 4.7 0.007 0.014 0.019 0.070 2 +10: win_setup_win_check 18 7.0 0.000 0.000 0.046 0.064 1 +10: mp_wait 18 8.0 0.046 0.064 0.046 0.064 4 +10: dbcsr_create_new 77 5.7 0.012 0.056 0.012 0.056 2 +10: dbcsr_redistribute 3 4.0 0.023 0.034 0.044 0.048 1 +10: dbcsr_checksum 5 4.0 0.023 0.036 0.041 0.045 1 +10: dbcsr_finalize 17 5.4 0.000 0.000 0.024 0.041 3 +10: dbcsr_merge_all 13 6.5 0.006 0.012 0.021 0.038 4 +10: mp_alltoall_i22 3 5.0 0.019 0.031 0.019 0.031 2 +10: mp_sum_d 76 1.3 0.019 0.029 0.019 0.029 5 +10: dbcsr_sort_indices 16 7.4 0.009 0.023 0.009 0.023 1 +10: dbcsr_make_random_matrix 3 3.0 0.009 0.010 0.016 0.022 4 +10: dbcsr_make_untransposed_blocks 20 5.0 0.016 0.021 0.016 0.021 3 +10: mp_win_create_dv 2 7.0 0.019 0.021 0.019 0.021 4 +10: mp_max_l 84 1.0 0.008 0.012 0.008 0.012 1 +10: dbcsr_mm_multrec_finalize 10 6.0 0.004 0.012 0.004 0.012 4 +10: mp_iallgather_i24 20 6.0 0.011 0.011 0.011 0.011 5 +10: dbcsr_add_wm_from_matrix 10 5.0 0.000 0.001 0.005 0.009 4 +10: dbcsr_fill_wm_from_matrix 10 6.0 0.004 0.008 0.004 0.009 1 +10: make_buffers_pack 20 6.0 0.007 0.008 0.007 0.008 5 +10: mp_rget_iv 140 7.0 0.002 0.008 0.002 0.008 6 +10: dbcsr_init_lib_low 1 1.0 0.002 0.007 0.002 0.007 1 +10: setup_rec_index_images 20 6.0 0.005 0.006 0.005 0.006 3 +10: dbcsr_mm_multrec_init 10 7.0 0.000 0.000 0.002 0.006 6 +10: dbcsr_mm_csr_init 10 8.0 0.001 0.005 0.002 0.006 4 +10: mp_maxloc_dv 191 1.0 0.005 0.006 0.005 0.006 4 +10: dbcsr_data_release 310 6.7 0.003 0.004 0.003 0.004 6 +10: dbcsr_switch_data_area 23 6.1 0.001 0.004 0.001 0.004 3 +10: dbcsr_data_copy_aa2 13 7.5 0.003 0.004 0.003 0.004 3 +10: dbcsr_work_destroy_all 16 6.4 0.001 0.001 0.003 0.003 2 +10: mp_rget_dv 140 7.0 0.002 0.003 0.002 0.003 5 +10: merge_index 13 7.5 0.002 0.002 0.002 0.002 3 +10: mp_cart_sub 2 5.0 0.002 0.002 0.002 0.002 0 +10: dbcsr_destroy 67 5.4 0.000 0.001 0.001 0.002 4 +10: fill_hash_tables 10 9.0 0.001 0.002 0.001 0.002 3 +10: make_buffers_data 20 6.0 0.001 0.001 0.001 0.002 3 +10: mp_bcast_av 93 1.0 0.001 0.001 0.001 0.001 3 +10: tree_to_linear_d 3 6.0 0.001 0.001 0.001 0.001 6 +10: mp_max_i 87 1.0 0.001 0.001 0.001 0.001 4 +10: hybrid_alltoall_any 20 7.0 0.000 0.001 0.001 0.001 6 +10: dbcsr_iterator_start 76 6.3 0.000 0.000 0.001 0.001 5 +10: mp_bcast_i 94 2.0 0.001 0.001 0.001 0.001 4 +10: dbcsr_data_new 179 6.1 0.000 0.001 0.000 0.001 1 +10: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 5 +10: dbcsr_make_index_exist 37 6.4 0.000 0.000 0.000 0.000 6 +10: dbcsr_iterator_stop 76 6.3 0.000 0.000 0.000 0.000 3 +10: multiply_3D_comm_left 70 7.0 0.000 0.000 0.000 0.000 2 +10: dbcsr_distribution_new 26 4.7 0.000 0.000 0.000 0.000 3 +10: mp_alltoall_d11v 9 5.0 0.000 0.000 0.000 0.000 1 10: mp_sum_root_rm 2 4.0 0.000 0.000 0.000 0.000 0 -10: dbcsr_get_data_size_used 16 6.4 0.000 0.000 0.000 0.000 1 -10: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 6 -10: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 11 -10: multiply_3D_sizes 10 6.0 0.000 0.000 0.000 0.000 11 -10: mp_irecv_dv 20 8.0 0.000 0.000 0.000 0.000 0 -10: dbcsr_mm_sched_init 10 9.0 0.000 0.000 0.000 0.000 6 -10: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 2 -10: mp_irecv_iv 20 7.0 0.000 0.000 0.000 0.000 3 -10: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 2 -10: mp_win_lock_all 4 7.0 0.000 0.000 0.000 0.000 5 -10: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 10 -10: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 0 -10: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 10 -10: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 6 -10: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 2 -10: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 6 -10: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 2 -10: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 3 -10: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 6 -10: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 7 -10: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 7 -10: dbcsr_mm_sched_finalize 10 7.0 0.000 0.000 0.000 0.000 0 -10: dbcsr_mm_hostdrv_init 10 10.0 0.000 0.000 0.000 0.000 11 +10: dbcsr_work_create 16 5.4 0.000 0.000 0.000 0.000 1 +10: dbcsr_iterator_seek 76 7.3 0.000 0.000 0.000 0.000 5 +10: mp_win_create_iv 2 7.0 0.000 0.000 0.000 0.000 0 +10: quick_finalize 3 6.0 0.000 0.000 0.000 0.000 3 +10: multiply_3D_sizes 10 6.0 0.000 0.000 0.000 0.000 1 +10: dbcsr_make_dbcsr_index 16 7.4 0.000 0.000 0.000 0.000 5 +10: mp_isum_bv 18 6.0 0.000 0.000 0.000 0.000 6 +10: dbcsr_dist_bin 4 3.0 0.000 0.000 0.000 0.000 1 +10: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 4 +10: dbcsr_verify_matrix 3 4.0 0.000 0.000 0.000 0.000 4 +10: dbcsr_mm_sched_init 10 9.0 0.000 0.000 0.000 0.000 4 +10: dbcsr_get_data_size_used 16 6.4 0.000 0.000 0.000 0.000 3 +10: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 4 +10: mp_sum_lv 2 1.0 0.000 0.000 0.000 0.000 0 +10: mp_alltoall_i11v 9 5.0 0.000 0.000 0.000 0.000 6 +10: dbcsr_get_local_rows 10 5.0 0.000 0.000 0.000 0.000 5 +10: dbcsr_get_local_cols 10 5.0 0.000 0.000 0.000 0.000 5 +10: dbcsr_get_global_col_map 10 5.0 0.000 0.000 0.000 0.000 2 +10: mp_bcast_iv 2 1.0 0.000 0.000 0.000 0.000 4 +10: mp_win_lock_all 4 7.0 0.000 0.000 0.000 0.000 2 +10: dbcsr_get_global_row_map 10 5.0 0.000 0.000 0.000 0.000 2 +10: dbcsr_mm_sched_finalize 10 7.0 0.000 0.000 0.000 0.000 4 +10: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 0 +10: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 5 +10: dbcsr_mm_hostdrv_init 10 10.0 0.000 0.000 0.000 0.000 4 +10: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 0 +10: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 4 +10: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 4 +10: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 4 +10: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 5 10: ------------------------------------------------------------------------------- 10: -10/19 Test #10: dbcsr_perf:inputs/test_square_sparse_rma.perf ......... Passed 0.58 sec +10/19 Test #10: dbcsr_perf:inputs/test_square_sparse_rma.perf ......... Passed 0.93 sec test 11 Start 11: dbcsr_unittest1 -11: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_unittest1" +11: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_unittest1" 11: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 11: Environment variables: 11: OMP_NUM_THREADS=2 11: Test timeout computed to be: 1500 11: test_name add_1 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 25 11: sparsities 0.69999999999999996 0.50000000000000000 11: alpha (1.0000000000000000,1.0000000000000000) @@ -4015,7 +4034,7 @@ 11: ********************************************************************** 11: test_name add_2 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 11: sparsities 0.40000000000000002 0.50000000000000000 11: alpha (3.0000000000000000,2.0000000000000000) @@ -4206,7 +4225,7 @@ 11: ********************************************************************** 11: test_name multiply_ALPHA 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 20 20 20 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (-3.0000000000000000,-4.0000000000000000) @@ -5838,7 +5857,7 @@ 11: ********************************************************************** 11: test_name multiply_BETA 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 20 20 20 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -7470,7 +7489,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_COL_1 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -9102,7 +9121,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_COL_2 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -10734,7 +10753,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_COL_3 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -12366,7 +12385,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_COL_4 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 25 50 75 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -12558,7 +12577,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_K_1 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -14310,7 +14329,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_K_2 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -16062,7 +16081,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_K_3 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -17814,7 +17833,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_K_4 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 25 50 75 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -18006,7 +18025,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_MIX_1 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -19638,7 +19657,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_MIX_2 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -21270,7 +21289,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_MIX_3 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -22902,7 +22921,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_MIX_4 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -24534,7 +24553,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_MIX_5 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -26166,7 +26185,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_MIX_6 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 25 50 75 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -26358,7 +26377,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_MIX_7 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 25 50 75 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,1.0000000000000000) @@ -26550,7 +26569,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_ROW_1 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -28182,7 +28201,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_ROW_2 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -29814,7 +29833,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_ROW_3 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -31446,7 +31465,7 @@ 11: ********************************************************************** 11: test_name multiply_LIMITS_ROW_4 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 25 50 75 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -31638,7 +31657,7 @@ 11: ********************************************************************** 11: test_name multiply_RT 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -33390,7 +33409,7 @@ 11: ********************************************************************** 11: test_name multiply_SQ 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 50 50 50 11: sparsities 0.0000000000000000 0.0000000000000000 0.0000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -35142,7 +35161,7 @@ 11: ********************************************************************** 11: test_name ub2 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 20 20 20 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -36774,7 +36793,7 @@ 11: ********************************************************************** 11: test_name ub-k-ghost 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 20 20 20 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -38406,7 +38425,7 @@ 11: ********************************************************************** 11: test_name ub-m-ghost 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 20 20 20 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -40038,7 +40057,7 @@ 11: ********************************************************************** 11: test_name ub-mnk-ghost 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 20 20 20 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -41670,7 +41689,7 @@ 11: ********************************************************************** 11: test_name ub-n-ghost 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 20 20 20 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -43302,7 +43321,7 @@ 11: ********************************************************************** 11: test_name ub 11: numthreads 2 -11: numnodes 12 +11: numnodes 7 11: matrix_sizes 20 20 20 11: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 11: alpha (1.0000000000000000,0.0000000000000000) @@ -45066,39 +45085,35 @@ 11: flops 2 x 2 x 1 6240 100.0% 0.0% 0.0% 11: flops 1 x 2 x 2 11352 100.0% 0.0% 0.0% 11: flops 4 x 4 x 4 257536 100.0% 0.0% 0.0% -11: flops 2 x 2 x 6 374400 100.0% 0.0% 0.0% -11: flops 8 x 18 x 6 684288 100.0% 0.0% 0.0% -11: flops 8 x 16 x 6 1216512 100.0% 0.0% 0.0% -11: flops 2 x 2 x 4 2745600 100.0% 0.0% 0.0% -11: flops 6 x 18 x 6 3592512 100.0% 0.0% 0.0% -11: flops 8 x 18 x 4 5018112 100.0% 0.0% 0.0% -11: flops 6 x 16 x 6 6386688 100.0% 0.0% 0.0% -11: flops 8 x 16 x 4 8921088 100.0% 0.0% 0.0% -11: flops 6 x 18 x 4 26345088 100.0% 0.0% 0.0% -11: flops 6 x 16 x 4 46835712 100.0% 0.0% 0.0% +11: flops 2 x 2 x 6 1123200 100.0% 0.0% 0.0% +11: flops 2 x 2 x 8 1996800 100.0% 0.0% 0.0% +11: flops 2 x 50 x 6 4276800 100.0% 0.0% 0.0% +11: flops 2 x 50 x 8 7603200 100.0% 0.0% 0.0% +11: flops 4 x 50 x 6 31363200 100.0% 0.0% 0.0% +11: flops 4 x 50 x 8 55756800 100.0% 0.0% 0.0% 11: flops 2 x 2 x 2 229160704 100.0% 0.0% 0.0% 11: flops inhomo. stacks 0 0.0% 0.0% 0.0% 11: flops total 331.559076E+06 100.0% 0.0% 0.0% -11: flops max/rank 34.169564E+06 100.0% 0.0% 0.0% +11: flops max/rank 55.107060E+06 100.0% 0.0% 0.0% 11: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% -11: matmuls total 14534538 100.0% 0.0% 0.0% -11: number of processed stacks 907085 100.0% 0.0% 0.0% -11: average stack size 16.0 0.0 0.0 -11: marketing flops 389.263424E+06 +11: matmuls total 14420298 100.0% 0.0% 0.0% +11: number of processed stacks 351183 100.0% 0.0% 0.0% +11: average stack size 41.1 0.0 0.0 +11: marketing flops 389.298752E+06 11: ------------------------------------------------------------------------------- 11: # multiplications 8100 -11: max memory usage/rank 99.954688E+06 -11: # max total images/rank 4 +11: max memory usage/rank 73.101312E+06 +11: # max total images/rank 7 11: # max 3D layers 1 -11: # MPI messages exchanged 1652400 +11: # MPI messages exchanged 340200 11: MPI messages size (bytes): -11: total size 250.771104E+06 +11: total size 300.724384E+06 11: min size 0.000000E+00 -11: max size 1.728000E+03 -11: average size 151.761734E+00 +11: max size 6.400000E+03 +11: average size 883.963501E+00 11: MPI breakdown and total messages size (bytes): -11: size <= 128 1120664 26246428 -11: 128 < size <= 8192 531736 224524672 +11: size <= 128 148800 2487720 +11: 128 < size <= 8192 191400 298236672 11: 8192 < size <= 32768 0 0 11: 32768 < size <= 131072 0 0 11: 131072 < size <= 4194304 0 0 @@ -45107,7 +45122,7 @@ 11: ------------------------------------------------------------------------------- 11: 11: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -11: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +11: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 11: 11: ------------------------------------------------------------------------------- 11: - - @@ -45115,11 +45130,11 @@ 11: - - 11: ------------------------------------------------------------------------------- 11: ROUTINE CALLS AVE VOLUME [Bytes] -11: MP_Bcast 8143 4. -11: MP_Allreduce 59011 8. -11: MP_Alltoall 186636 2391. -11: MP_ISend 452556 148. -11: MP_IRecv 424560 154. +11: MP_Bcast 8139 4. +11: MP_Allreduce 59003 8. +11: MP_Alltoall 186636 2368. +11: MP_ISend 241596 393. +11: MP_IRecv 247862 399. 11: ------------------------------------------------------------------------------- 11: 11: ------------------------------------------------------------------------------- @@ -45129,157 +45144,156 @@ 11: ------------------------------------------------------------------------------- 11: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 11: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -11: dbcsr_unittest 1 1.0 0.001 0.001 398.283 398.287 8 -11: dbcsr_test_multiplies 29 2.0 3.205 3.663 397.319 397.322 10 -11: test_multiply 8100 3.0 0.570 0.855 384.984 387.332 1 -11: dbcsr_multiply_generic 8100 4.0 0.684 1.052 186.815 187.845 1 -11: dbcsr_redistribute 24348 4.0 28.573 31.225 112.856 117.345 2 -11: make_m2s 16200 5.0 0.700 1.073 104.737 106.469 2 -11: make_images 16200 6.0 8.202 9.002 91.973 93.154 2 -11: mp_alltoall_i22 24348 5.0 79.961 85.270 79.961 85.270 1 -11: multiply_cannon 8100 5.0 5.053 5.580 67.591 70.263 0 -11: mp_sum_l 59029 4.4 53.300 56.870 53.300 56.870 0 -11: make_images_sizes 16200 7.0 0.198 0.543 46.949 49.194 6 -11: mp_alltoall_i44 16200 8.0 46.751 49.165 46.751 49.165 0 -11: mp_waitall_1 356400 8.3 44.431 47.278 44.431 47.278 9 -11: multiply_cannon_loop 8100 6.0 2.708 3.285 30.346 31.903 0 -11: make_images_data 16200 7.0 0.430 0.449 26.997 28.984 11 -11: mp_allgather_i34 8100 6.0 25.946 28.100 25.946 28.100 2 -11: dbcsr_replicate 8124 4.0 0.458 0.554 25.872 26.275 4 -11: dbcsr_create_new 290640 6.5 14.200 15.253 19.716 21.244 6 -11: hybrid_alltoall_any 16200 8.0 0.859 1.281 19.072 21.236 1 -11: dbcsr_make_random_matrix 24348 3.0 2.352 10.081 8.215 20.807 0 -11: dbcsr_finalize 170364 6.6 1.869 2.404 12.775 17.275 9 -11: mp_allgather_i12 8124 5.0 16.255 16.884 16.255 16.884 11 -11: dbcsr_merge_all 85368 7.3 7.961 9.022 9.700 14.106 0 -11: multiply_cannon_metrocomm1 97200 7.0 0.194 0.550 10.752 12.607 5 -11: multiply_cannon_metrocomm3 97200 7.0 0.183 0.891 8.637 10.029 2 -11: dbcsr_check_multiply 8100 4.0 1.529 1.761 6.101 9.915 0 -11: mp_bcast_b 8124 5.0 4.320 8.218 4.320 8.218 11 -11: multiply_cannon_multrec 97200 7.0 6.122 7.013 6.925 7.829 6 -11: dbcsr_special_finalize 56700 7.0 0.752 1.164 6.788 7.687 11 -11: dbcsr_merge_single_wm 53928 8.0 4.609 5.645 5.382 6.330 7 -11: dbcsr_make_index_exist 290640 7.5 5.249 5.790 5.249 5.790 7 -11: dbcsr_crop_matrix 44772 6.0 0.233 0.240 5.066 5.606 4 -11: dbcsr_copy_submatrix 44772 7.0 0.819 1.028 4.589 5.137 5 -11: dbcsr_new_transposed 10752 5.0 0.523 0.590 4.218 4.818 10 -11: dbcsr_to_dense_local 32472 3.3 1.808 4.617 1.975 4.794 0 -11: dbcsr_make_images_dense 840 6.0 0.025 0.025 3.759 4.308 7 -11: dbcsr_iterator_start 232818 6.2 3.103 3.763 3.245 3.900 6 -11: setup_buffer_matrices 16200 6.0 0.154 0.195 2.847 3.481 5 -11: dbcsr_make_dense_low 3336 6.9 0.033 0.033 2.820 3.475 5 -11: make_dense_data 3336 7.9 0.734 1.265 2.776 3.430 7 -11: dbcsr_make_index_list 56700 6.0 1.647 2.597 1.647 2.597 4 -11: buffer_matrices_ensure_size 16200 6.0 1.325 1.797 1.325 1.797 4 -11: quick_finalize 27120 6.2 1.073 1.607 1.239 1.756 6 -11: dbcsr_copy 60324 5.7 0.368 0.448 1.433 1.680 1 -11: dbcsr_iterator_stop 232818 6.2 1.454 1.564 1.532 1.641 6 -11: dbcsr_scale_anytype 7080 5.0 0.157 0.554 1.058 1.589 6 -11: dbcsr_data_new 924846 6.6 0.944 1.559 0.944 1.559 2 -11: setup_rec_index_2d 16200 6.0 1.146 1.517 1.146 1.517 2 -11: multiply_cannon_metrocomm4 64800 7.0 0.311 0.315 0.594 1.511 2 -11: dbcsr_mm_multrec_init 8100 6.0 0.018 0.019 0.757 1.286 1 -11: multiply_cannon_multrec_finali 8100 8.0 0.031 0.186 0.802 1.275 11 -11: mp_allgatherv_iv 8124 5.0 0.841 1.268 0.841 1.268 8 -11: dbcsr_mm_csr_init 8100 7.0 0.689 1.219 0.739 1.268 4 -11: dbcsr_mm_multrec_finalize 8100 9.0 0.766 1.254 0.772 1.260 3 -11: dbcsr_destroy 290496 5.3 0.680 1.064 0.841 1.216 7 -11: multiply_cannon_metrocomm2 72900 7.0 0.369 0.478 0.730 1.178 4 -11: dbcsr_sort_indices 133097 7.7 0.783 1.177 0.783 1.177 0 -11: mp_alltoall_r11v 18585 5.0 0.730 1.176 0.730 1.176 1 -11: dbcsr_sort_data 62052 8.7 0.804 1.121 0.804 1.121 3 -11: mp_alltoall_z11v 17937 5.0 0.759 1.076 0.759 1.076 6 -11: dbcsr_test_adds 2 2.0 0.039 0.087 0.964 0.965 11 -11: test_add 24 3.0 0.001 0.001 0.914 0.932 0 -11: dbcsr_data_release 1369572 6.7 0.690 0.932 0.690 0.932 6 -11: merge_index 85368 8.3 0.675 0.882 0.675 0.882 0 -11: tree_to_linear_z 5979 6.0 0.086 0.881 0.086 0.881 0 -11: dbcsr_work_create 166416 6.4 0.455 0.686 0.627 0.840 4 -11: tree_to_linear_s 6195 6.0 0.070 0.768 0.070 0.768 0 -11: mp_alltoall_c11v 17937 5.0 0.657 0.753 0.657 0.753 11 -11: dbcsr_make_dense 396 5.0 0.003 0.003 0.622 0.715 0 -11: mp_alltoall_d11v 18585 5.0 0.639 0.714 0.639 0.714 11 -11: dbcsr_make_undense 396 5.0 0.166 0.240 0.542 0.691 6 -11: mp_isend_rv 56324 8.4 0.183 0.664 0.183 0.664 4 -11: tree_to_linear_c 5979 6.0 0.059 0.632 0.059 0.632 0 -11: tree_to_linear_d 6195 6.0 0.057 0.610 0.057 0.610 0 -11: dbcsr_work_destroy_all 166416 7.3 0.388 0.398 0.496 0.548 0 -11: dbcsr_distribution_new 76884 4.5 0.174 0.546 0.174 0.546 2 -11: mp_sum_b 2184 5.0 0.419 0.483 0.419 0.483 8 -11: dbcsr_make_untransposed_blocks 15156 5.0 0.307 0.396 0.395 0.483 6 -11: mp_irecv_rv 58765 8.4 0.112 0.427 0.112 0.427 4 -11: make_images_pack 16200 7.0 0.190 0.242 0.284 0.404 0 -11: dbcsr_make_dists_dense 420 5.0 0.190 0.331 0.193 0.333 3 -11: dbcsr_impose_sparsity 4484 5.0 0.255 0.263 0.289 0.297 6 -11: mp_alltoall_i11v 73044 5.0 0.235 0.285 0.235 0.285 1 -11: dbcsr_add_wm_from_matrix 7056 5.0 0.070 0.090 0.248 0.269 9 -11: dbcsr_verify_matrix 32472 4.3 0.121 0.253 0.121 0.253 4 -11: mp_allgatherv_zv 1995 5.0 0.198 0.236 0.198 0.236 9 -11: dbcsr_add_anytype 24 4.0 0.003 0.009 0.054 0.224 8 -11: mp_isend_iv 242189 8.0 0.216 0.223 0.216 0.223 2 -11: dbcsr_switch_data_area 110904 6.6 0.156 0.159 0.208 0.213 11 -11: dbcsr_make_index_local_row 56700 6.0 0.087 0.212 0.087 0.212 10 -11: dbcsr_get_data_size_used 109716 7.0 0.125 0.188 0.125 0.188 8 -11: dbcsr_get_local_cols 8496 5.0 0.047 0.175 0.047 0.175 0 -11: dbcsr_fill_wm_from_matrix 7056 6.0 0.107 0.121 0.144 0.158 2 -11: dbcsr_iterator_seek 232818 7.2 0.142 0.157 0.142 0.157 0 -11: mp_irecv_iv 251143 8.0 0.135 0.142 0.135 0.142 3 -11: mp_allgatherv_rv 2067 5.0 0.117 0.141 0.117 0.141 3 -11: dbcsr_make_dbcsr_index 177384 8.3 0.099 0.120 0.099 0.120 0 -11: mp_isend_dv 56343 8.4 0.060 0.115 0.060 0.115 3 -11: mp_allgatherv_cv 1995 5.0 0.086 0.106 0.086 0.106 2 -11: mp_irecv_dv 58782 8.4 0.042 0.102 0.042 0.102 6 -11: dbcsr_data_copy_aa2 38782 8.4 0.021 0.102 0.021 0.102 0 -11: transpose_index_local 10752 6.0 0.037 0.040 0.088 0.100 11 -11: dbcsr_conjg 5376 5.0 0.060 0.066 0.090 0.096 11 -11: mp_irecv_zv 56683 8.4 0.040 0.082 0.040 0.082 11 -11: mp_allgatherv_dv 2067 5.0 0.055 0.064 0.055 0.064 3 -11: dbcsr_check_add 24 4.0 0.005 0.006 0.042 0.063 0 -11: dbcsr_get_local_rows 8496 5.0 0.027 0.059 0.027 0.059 2 -11: mp_isend_zv 54225 8.4 0.056 0.059 0.056 0.059 7 -11: mp_isend_cv 54277 8.4 0.052 0.054 0.052 0.054 7 -11: mp_irecv_cv 56607 8.4 0.036 0.042 0.036 0.042 6 -11: fill_hash_tables 8100 8.0 0.032 0.034 0.032 0.034 11 -11: dbcsr_mm_sched_init 8100 8.0 0.015 0.016 0.018 0.019 5 -11: dbcsr_get_global_row_map 8100 5.0 0.008 0.009 0.008 0.009 3 -11: dbcsr_get_global_col_map 8100 5.0 0.007 0.008 0.007 0.008 2 -11: dbcsr_mm_sched_finalize 8100 10.0 0.006 0.006 0.006 0.006 10 -11: dbcsr_index_prune_deleted 2940 7.0 0.005 0.005 0.005 0.005 1 -11: dbcsr_init_lib_low 1 1.0 0.002 0.005 0.002 0.005 8 -11: dbcsr_mm_hostdrv_init 8100 9.0 0.003 0.003 0.003 0.003 5 -11: mp_max_l 124 1.0 0.002 0.003 0.002 0.003 1 -11: mp_bcast_av 133 1.0 0.000 0.000 0.002 0.003 10 -11: mp_bcast_i 134 2.0 0.002 0.002 0.002 0.002 5 -11: mp_maxloc_dv 271 1.0 0.001 0.001 0.001 0.001 1 -11: mp_sum_d 273 1.0 0.001 0.001 0.001 0.001 5 -11: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 0 -11: mp_comm_free 4 2.0 0.000 0.001 0.000 0.001 2 -11: mp_max_i 144 1.0 0.001 0.001 0.001 0.001 0 -11: mp_sum_lv 19 1.0 0.000 0.000 0.000 0.000 0 -11: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 2 -11: mp_bcast_iv 19 1.0 0.000 0.000 0.000 0.000 9 -11: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 8 -11: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 3 +11: dbcsr_unittest 1 1.0 0.000 0.000 1124.203 1124.213 4 +11: dbcsr_test_multiplies 29 2.0 8.892 10.938 1123.435 1123.446 3 +11: test_multiply 8100 3.0 0.612 0.683 1101.808 1107.493 0 +11: dbcsr_multiply_generic 8100 4.0 1.247 1.277 553.706 555.340 2 +11: make_m2s 16200 5.0 1.308 1.324 288.465 292.597 4 +11: make_images 16200 6.0 24.515 26.518 264.268 268.989 0 +11: dbcsr_redistribute 24348 4.0 49.627 57.248 246.711 261.200 4 +11: multiply_cannon 8100 5.0 16.811 17.549 218.779 226.086 2 +11: mp_alltoall_i22 24348 5.0 184.680 195.408 184.680 195.408 1 +11: mp_waitall_1 388800 8.2 181.558 185.003 181.558 185.003 3 +11: mp_sum_l 59029 4.4 171.867 178.834 171.867 178.834 0 +11: multiply_cannon_loop 8100 6.0 7.170 7.941 127.456 130.320 4 +11: dbcsr_replicate 8124 4.0 0.986 1.072 119.553 121.798 6 +11: make_images_sizes 16200 7.0 0.075 0.077 117.701 120.762 3 +11: mp_alltoall_i44 16200 8.0 117.626 120.688 117.626 120.688 5 +11: multiply_cannon_metrocomm1 56700 7.0 0.648 0.658 94.167 96.047 2 +11: make_images_data 16200 7.0 0.997 1.025 91.905 95.026 6 +11: hybrid_alltoall_any 16200 8.0 2.226 2.413 73.498 76.204 3 +11: mp_allgather_i34 8100 6.0 64.502 71.047 64.502 71.047 1 +11: mp_allgather_i12 8124 5.0 58.018 60.560 58.018 60.560 1 +11: dbcsr_create_new 320052 6.6 39.861 46.467 47.153 53.320 0 +11: dbcsr_finalize 185424 6.7 4.171 4.502 32.127 41.883 6 +11: dbcsr_merge_all 91764 7.4 22.716 28.608 25.665 35.398 0 +11: dbcsr_make_random_matrix 24348 3.0 3.928 13.503 11.042 30.009 0 +11: dbcsr_check_multiply 8100 4.0 1.914 2.148 20.341 29.656 0 +11: mp_bcast_b 8124 5.0 18.085 27.506 18.085 27.506 6 +11: dbcsr_special_finalize 64800 7.0 1.397 1.673 24.615 26.925 5 +11: multiply_cannon_multrec 56700 7.0 20.613 22.258 25.064 26.271 0 +11: mp_allgatherv_iv 8124 5.0 22.866 24.085 22.866 24.085 0 +11: dbcsr_crop_matrix 51168 6.0 0.658 0.673 17.375 18.743 5 +11: dbcsr_copy_submatrix 51168 7.0 2.420 2.682 15.850 17.198 6 +11: dbcsr_new_transposed 10752 5.0 0.916 1.039 16.359 17.077 5 +11: dbcsr_merge_single_wm 53928 8.0 11.621 12.979 13.291 14.825 5 +11: quick_finalize 35220 6.6 9.869 10.428 10.351 10.916 3 +11: dbcsr_make_index_exist 320052 7.6 6.685 7.399 6.685 7.399 4 +11: dbcsr_to_dense_local 32472 3.3 2.488 5.683 2.902 6.112 0 +11: dbcsr_iterator_start 242042 6.3 5.459 5.639 5.869 6.077 0 +11: multiply_cannon_multrec_finali 8100 8.0 0.039 0.040 4.451 5.051 2 +11: dbcsr_mm_multrec_finalize 8100 9.0 4.397 4.995 4.413 5.012 6 +11: dbcsr_copy 66720 5.8 0.862 0.954 3.964 4.263 3 +11: setup_buffer_matrices 16200 6.0 0.373 0.379 3.232 3.676 6 +11: dbcsr_scale_anytype 7080 5.0 0.245 0.270 3.533 3.627 6 +11: setup_rec_index_2d 16200 6.0 3.349 3.622 3.349 3.622 4 +11: mp_alltoall_z11v 17937 5.0 2.687 3.352 2.687 3.352 4 +11: mp_alltoall_d11v 18585 5.0 2.420 2.975 2.420 2.975 4 +11: mp_alltoall_r11v 18585 5.0 2.332 2.891 2.332 2.891 6 +11: dbcsr_iterator_stop 242042 6.3 2.275 2.570 2.551 2.835 0 +11: mp_sum_b 2184 5.0 2.498 2.785 2.498 2.785 1 +11: buffer_matrices_ensure_size 16200 6.0 1.826 2.751 1.826 2.751 0 +11: mp_alltoall_c11v 17937 5.0 2.021 2.532 2.021 2.532 2 +11: dbcsr_make_index_list 64800 6.0 1.807 2.375 1.807 2.375 3 +11: dbcsr_data_release 1462180 6.8 1.993 2.146 1.993 2.146 0 +11: dbcsr_destroy 319908 5.3 1.565 1.593 2.041 2.066 3 +11: mp_allgatherv_zv 1995 5.0 1.980 2.052 1.980 2.052 6 +11: dbcsr_data_new 984794 6.7 1.922 1.985 1.922 1.985 0 +11: dbcsr_sort_data 62052 8.7 1.743 1.911 1.743 1.911 5 +11: mp_allgatherv_rv 2067 5.0 1.824 1.893 1.824 1.893 3 +11: mp_allgatherv_cv 1995 5.0 1.766 1.870 1.766 1.870 6 +11: mp_allgatherv_dv 2067 5.0 1.804 1.863 1.804 1.863 2 +11: dbcsr_sort_indices 142124 7.8 1.244 1.766 1.244 1.766 0 +11: dbcsr_work_create 180912 6.5 1.139 1.161 1.606 1.628 6 +11: merge_index 91764 8.4 1.103 1.622 1.103 1.622 0 +11: dbcsr_work_destroy_all 180912 7.4 1.129 1.165 1.491 1.540 0 +11: mp_alltoall_i11v 73044 5.0 0.674 1.307 0.674 1.307 3 +11: dbcsr_mm_multrec_init 8100 6.0 0.049 0.051 1.166 1.285 5 +11: dbcsr_mm_csr_init 8100 7.0 1.020 1.153 1.117 1.236 2 +11: multiply_cannon_metrocomm2 48600 7.0 0.593 0.611 0.993 1.015 3 +11: tree_to_linear_z 5979 6.0 0.138 0.873 0.138 0.873 0 +11: dbcsr_make_untransposed_blocks 15156 5.0 0.518 0.606 0.753 0.842 3 +11: dbcsr_test_adds 2 2.0 0.014 0.037 0.768 0.771 6 +11: tree_to_linear_c 5979 6.0 0.122 0.764 0.122 0.764 0 +11: dbcsr_add_wm_from_matrix 7056 5.0 0.233 0.295 0.702 0.751 1 +11: tree_to_linear_s 6195 6.0 0.120 0.746 0.120 0.746 0 +11: test_add 24 3.0 0.002 0.002 0.729 0.740 0 +11: tree_to_linear_d 6195 6.0 0.117 0.729 0.117 0.729 0 +11: make_images_pack 16200 7.0 0.404 0.449 0.606 0.655 3 +11: dbcsr_switch_data_area 125820 6.8 0.467 0.477 0.624 0.648 2 +11: dbcsr_make_images_dense 840 6.0 0.055 0.060 0.543 0.589 2 +11: dbcsr_fill_wm_from_matrix 7056 6.0 0.283 0.399 0.384 0.499 0 +11: dbcsr_get_data_size_used 116112 7.1 0.375 0.451 0.375 0.451 6 +11: dbcsr_iterator_seek 242042 7.3 0.411 0.438 0.411 0.438 0 +11: dbcsr_verify_matrix 32472 4.3 0.206 0.425 0.206 0.425 0 +11: dbcsr_impose_sparsity 4484 5.0 0.319 0.334 0.393 0.407 6 +11: dbcsr_make_dense_low 3756 6.9 0.084 0.094 0.349 0.392 3 +11: dbcsr_make_dbcsr_index 191880 8.3 0.310 0.363 0.310 0.363 0 +11: mp_isend_iv 144156 8.0 0.324 0.349 0.324 0.349 6 +11: make_dense_data 3756 7.9 0.087 0.114 0.228 0.281 5 +11: dbcsr_make_dists_dense 420 5.0 0.186 0.277 0.190 0.281 6 +11: dbcsr_distribution_new 76884 4.5 0.230 0.237 0.230 0.237 6 +11: mp_irecv_iv 142845 8.0 0.230 0.235 0.230 0.235 2 +11: dbcsr_conjg 5376 5.0 0.124 0.140 0.198 0.215 6 +11: transpose_index_local 10752 6.0 0.091 0.099 0.185 0.200 6 +11: dbcsr_data_copy_aa2 39647 8.3 0.061 0.183 0.061 0.183 0 +11: dbcsr_check_add 24 4.0 0.011 0.013 0.063 0.163 6 +11: dbcsr_make_index_local_row 64800 6.0 0.140 0.148 0.140 0.148 5 +11: dbcsr_add_anytype 24 4.0 0.014 0.023 0.035 0.104 4 +11: dbcsr_make_dense 396 5.0 0.006 0.007 0.076 0.091 4 +11: mp_isend_zv 28308 8.6 0.081 0.084 0.081 0.084 6 +11: mp_isend_dv 29334 8.6 0.075 0.080 0.075 0.080 6 +11: mp_isend_rv 29407 8.6 0.071 0.078 0.071 0.078 2 +11: mp_isend_cv 28255 8.6 0.072 0.078 0.072 0.078 6 +11: dbcsr_make_undense 396 5.0 0.031 0.033 0.063 0.072 6 +11: multiply_cannon_metrocomm3 56700 7.0 0.062 0.067 0.062 0.067 5 +11: fill_hash_tables 8100 8.0 0.051 0.065 0.051 0.065 4 +11: mp_irecv_cv 27892 8.6 0.047 0.059 0.047 0.059 0 +11: dbcsr_mm_sched_init 8100 8.0 0.037 0.049 0.047 0.058 5 +11: mp_irecv_zv 27907 8.6 0.048 0.055 0.048 0.055 4 +11: mp_irecv_rv 28959 8.6 0.048 0.053 0.048 0.053 6 +11: mp_irecv_dv 29030 8.6 0.047 0.049 0.047 0.049 1 +11: dbcsr_get_local_rows 8496 5.0 0.048 0.049 0.048 0.049 0 +11: dbcsr_get_local_cols 8496 5.0 0.029 0.042 0.029 0.042 1 +11: dbcsr_get_global_row_map 8100 5.0 0.017 0.017 0.017 0.017 6 +11: dbcsr_mm_sched_finalize 8100 10.0 0.016 0.017 0.016 0.017 6 +11: mp_bcast_av 132 1.0 0.001 0.001 0.013 0.015 4 +11: dbcsr_get_global_col_map 8100 5.0 0.015 0.015 0.015 0.015 0 +11: mp_bcast_i 133 2.0 0.012 0.014 0.012 0.014 1 +11: mp_max_l 123 1.0 0.010 0.013 0.010 0.013 0 +11: dbcsr_index_prune_deleted 3360 7.0 0.010 0.013 0.010 0.013 0 +11: dbcsr_mm_hostdrv_init 8100 9.0 0.009 0.010 0.009 0.010 3 +11: mp_sum_d 271 1.0 0.003 0.003 0.003 0.003 1 +11: mp_maxloc_dv 269 1.0 0.002 0.002 0.002 0.002 3 +11: dbcsr_init_lib_low 1 1.0 0.001 0.002 0.001 0.002 6 +11: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 3 +11: mp_max_i 139 1.0 0.001 0.001 0.001 0.001 1 +11: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 6 +11: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 4 +11: mp_sum_lv 15 1.0 0.000 0.000 0.000 0.000 1 +11: mp_bcast_iv 15 1.0 0.000 0.000 0.000 0.000 5 +11: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 5 +11: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 1 11: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 4 -11: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 4 -11: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 1 -11: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 3 +11: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 4 +11: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 2 +11: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 6 11: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 1 -11: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 11 +11: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 1 11: ------------------------------------------------------------------------------- 11: -11/19 Test #11: dbcsr_unittest1 ....................................... Passed 398.44 sec +11/19 Test #11: dbcsr_unittest1 ....................................... Passed 1124.34 sec test 12 Start 12: dbcsr_unittest2 -12: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_unittest2" +12: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_unittest2" 12: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 12: Environment variables: 12: OMP_NUM_THREADS=2 12: Test timeout computed to be: 1500 12: test_name large_blocks_1 12: numthreads 2 -12: numnodes 12 +12: numnodes 7 12: matrix_sizes 500 500 500 12: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 12: alpha (1.0000000000000000,0.0000000000000000) @@ -47031,7 +47045,7 @@ 12: ********************************************************************** 12: test_name large_blocks_2 12: numthreads 2 -12: numnodes 12 +12: numnodes 7 12: matrix_sizes 500 50 50 12: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 12: alpha (1.0000000000000000,0.0000000000000000) @@ -47583,7 +47597,7 @@ 12: ********************************************************************** 12: test_name rectangular_matrix_M 12: numthreads 2 -12: numnodes 12 +12: numnodes 7 12: matrix_sizes 500 50 50 12: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 12: alpha (1.0000000000000000,0.0000000000000000) @@ -48135,7 +48149,7 @@ 12: ********************************************************************** 12: test_name rectangular_matrix_K 12: numthreads 2 -12: numnodes 12 +12: numnodes 7 12: matrix_sizes 50 50 500 12: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 12: alpha (1.0000000000000000,0.0000000000000000) @@ -48377,35 +48391,35 @@ 12: flops 100 x 100 x 100 20756000000 100.0% 0.0% 0.0% 12: flops inhomo. stacks 0 0.0% 0.0% 0.0% 12: flops total 20.914688E+09 100.0% 0.0% 0.0% -12: flops max/rank 3.393949E+09 100.0% 0.0% 0.0% +12: flops max/rank 4.314545E+09 100.0% 0.0% 0.0% 12: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% 12: matmuls total 385455 100.0% 0.0% 0.0% -12: number of processed stacks 46755 100.0% 0.0% 0.0% -12: average stack size 8.2 0.0 0.0 -12: marketing flops 87.649976E+09 +12: number of processed stacks 19028 100.0% 0.0% 0.0% +12: average stack size 20.3 0.0 0.0 +12: marketing flops 87.650058E+09 12: ------------------------------------------------------------------------------- 12: # multiplications 608 -12: max memory usage/rank 130.600960E+06 -12: # max total images/rank 4 +12: max memory usage/rank 100.913152E+06 +12: # max total images/rank 7 12: # max 3D layers 1 -12: # MPI messages exchanged 124032 +12: # MPI messages exchanged 25536 12: MPI messages size (bytes): -12: total size 1.959741E+09 +12: total size 2.309977E+09 12: min size 0.000000E+00 -12: max size 320.000000E+03 -12: average size 15.800288E+03 +12: max size 800.000000E+03 +12: average size 90.459609E+03 12: MPI breakdown and total messages size (bytes): -12: size <= 128 74900 83700 -12: 128 < size <= 8192 30338 65750000 -12: 8192 < size <= 32768 759 12988400 -12: 32768 < size <= 131072 12137 818200000 -12: 131072 < size <= 4194304 5898 1062720000 +12: size <= 128 5964 1200 +12: 128 < size <= 8192 8166 17752200 +12: 8192 < size <= 32768 1338 24063600 +12: 32768 < size <= 131072 2988 252158400 +12: 131072 < size <= 4194304 7080 2016000000 12: 4194304 < size <= 16777216 0 0 12: 16777216 < size 0 0 12: ------------------------------------------------------------------------------- 12: 12: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -12: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +12: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 12: 12: ------------------------------------------------------------------------------- 12: - - @@ -48415,9 +48429,9 @@ 12: ROUTINE CALLS AVE VOLUME [Bytes] 12: MP_Bcast 612 4. 12: MP_Allreduce 4601 8. -12: MP_Alltoall 13984 81557. -12: MP_ISend 24330 6500. -12: MP_IRecv 24344 6099. +12: MP_Alltoall 13984 71557. +12: MP_ISend 9862 36837. +12: MP_IRecv 11242 34438. 12: ------------------------------------------------------------------------------- 12: 12: ------------------------------------------------------------------------------- @@ -48427,140 +48441,139 @@ 12: ------------------------------------------------------------------------------- 12: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 12: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -12: dbcsr_unittest 1 1.0 0.000 0.001 625.833 625.834 0 -12: dbcsr_test_multiplies 4 2.0 6.838 7.415 625.833 625.834 2 -12: test_multiply 608 3.0 0.119 0.463 587.295 590.547 6 -12: dbcsr_multiply_generic 608 4.0 1.063 1.581 218.692 221.394 4 -12: dbcsr_check_multiply 608 4.0 170.756 178.718 198.029 212.588 2 -12: dbcsr_redistribute 1824 4.0 4.762 7.833 90.087 105.430 10 -12: multiply_cannon 608 5.0 4.664 6.409 97.872 99.866 5 -12: mp_alltoall_i22 1824 5.0 78.632 98.009 78.632 98.009 1 -12: make_m2s 1216 5.0 0.116 0.580 92.437 95.581 0 -12: make_images 1216 6.0 8.618 10.401 83.056 86.494 11 -12: dbcsr_create_new 14816 6.0 33.064 34.672 55.833 59.471 3 -12: multiply_cannon_loop 608 6.0 9.870 11.157 49.069 51.241 10 -12: mp_sum_l 4649 4.4 47.713 50.885 47.713 50.885 6 -12: mp_bcast_b 608 5.0 27.273 42.274 27.273 42.274 11 -12: dbcsr_make_random_matrix 1824 3.0 0.917 8.064 26.808 38.043 0 -12: make_images_sizes 1216 7.0 0.004 0.004 33.025 37.469 8 -12: mp_alltoall_i44 1216 8.0 33.022 37.465 33.022 37.465 0 -12: dbcsr_finalize 4864 4.6 3.319 4.314 26.783 30.891 11 -12: dbcsr_replicate 608 4.0 0.067 0.388 29.874 30.694 4 -12: dbcsr_merge_all 3040 5.4 19.906 22.051 23.246 27.361 10 -12: mp_allgather_i34 608 6.0 23.581 27.091 23.581 27.091 5 -12: mp_waitall_1 26752 8.3 23.089 26.005 23.089 26.005 1 -12: dbcsr_make_index_exist 14816 7.0 22.559 24.484 22.559 24.484 8 -12: multiply_cannon_multrec 7296 7.0 20.627 22.338 21.185 23.369 8 -12: dbcsr_special_finalize 4256 7.0 7.118 8.381 21.209 22.999 1 -12: setup_buffer_matrices 1216 6.0 0.064 0.551 13.423 15.329 9 -12: dbcsr_merge_single_wm 4256 8.0 11.559 12.804 13.891 15.175 2 -12: multiply_cannon_metrocomm1 7296 7.0 0.194 0.773 12.058 14.116 0 -12: dbcsr_make_index_list 4256 6.0 9.259 10.414 9.259 10.414 4 -12: mp_allgatherv_zv 144 5.0 8.288 8.574 8.288 8.574 8 -12: make_images_data 1216 7.0 0.062 0.119 6.756 8.516 3 -12: dbcsr_to_dense_local 2432 3.2 6.262 7.900 6.377 7.924 0 -12: multiply_cannon_metrocomm3 7296 7.0 0.018 0.096 5.558 7.422 8 -12: hybrid_alltoall_any 1216 8.0 0.950 2.190 5.021 6.737 10 -12: setup_rec_index_2d 1216 6.0 5.314 6.045 5.314 6.045 6 -12: dbcsr_new_transposed 800 5.0 0.078 0.459 5.174 5.658 2 -12: mp_alltoall_i11v 5472 5.0 2.125 4.897 2.125 4.897 2 -12: mp_allgather_i12 608 5.0 4.297 4.699 4.297 4.699 11 -12: dbcsr_copy 1248 4.9 0.161 0.421 4.011 4.660 11 -12: mp_allgatherv_dv 160 5.0 4.319 4.544 4.319 4.544 9 -12: dbcsr_sort_data 4864 8.8 3.186 4.230 3.186 4.230 9 -12: mp_alltoall_d11v 1440 5.0 1.675 3.684 1.675 3.684 4 -12: mp_allgatherv_iv 608 5.0 2.537 2.827 2.537 2.827 6 -12: merge_index 3040 6.4 1.915 2.765 1.915 2.765 0 -12: mp_allgatherv_cv 144 5.0 2.425 2.548 2.425 2.548 7 -12: mp_alltoall_z11v 1296 5.0 1.296 2.302 1.296 2.302 0 -12: mp_allgatherv_rv 160 5.0 2.028 2.222 2.028 2.222 1 -12: dbcsr_data_release 71212 6.1 1.277 2.045 1.277 2.045 3 -12: buffer_matrices_ensure_size 1216 6.0 1.528 1.993 1.528 1.993 3 -12: dbcsr_iterator_start 10736 5.5 0.592 1.630 0.601 1.642 0 -12: mp_alltoall_c11v 1296 5.0 0.824 1.628 0.824 1.628 0 -12: dbcsr_make_untransposed_blocks 608 5.0 0.958 1.585 0.963 1.590 11 -12: dbcsr_data_new 48624 5.9 0.825 1.353 0.825 1.353 8 -12: mp_sum_b 320 5.0 1.032 1.341 1.032 1.341 8 -12: dbcsr_data_copy_aa2 2319 6.7 0.191 1.333 0.191 1.333 0 -12: dbcsr_destroy 14784 4.9 0.104 0.409 0.531 1.222 5 -12: multiply_cannon_metrocomm2 5472 7.0 0.031 0.038 0.298 1.216 8 -12: multiply_cannon_multrec_finali 608 8.0 0.002 0.002 0.557 1.184 11 -12: dbcsr_mm_multrec_finalize 608 9.0 0.555 1.182 0.556 1.182 0 -12: tree_to_linear_s 480 6.0 0.134 1.005 0.134 1.005 9 -12: dbcsr_work_create 9120 5.7 0.097 0.443 0.199 0.963 1 -12: tree_to_linear_z 432 6.0 0.080 0.956 0.080 0.956 0 -12: make_images_pack 1216 7.0 0.184 0.556 0.298 0.916 7 -12: mp_isend_dv 3408 8.1 0.117 0.803 0.117 0.803 1 -12: mp_alltoall_r11v 1440 5.0 0.460 0.730 0.460 0.730 0 -12: tree_to_linear_d 480 6.0 0.059 0.698 0.059 0.698 0 -12: dbcsr_work_destroy_all 9120 6.7 0.240 0.601 0.342 0.674 1 -12: dbcsr_mm_multrec_init 608 6.0 0.002 0.002 0.226 0.614 0 -12: dbcsr_mm_csr_init 608 7.0 0.220 0.609 0.224 0.612 10 -12: mp_isend_iv 13957 8.0 0.142 0.545 0.142 0.545 10 -12: dbcsr_sort_indices 7367 7.2 0.078 0.516 0.078 0.516 11 -12: dbcsr_get_local_rows 608 5.0 0.040 0.448 0.040 0.448 8 -12: multiply_cannon_metrocomm4 4864 7.0 0.026 0.030 0.100 0.424 3 -12: mp_isend_rv 3397 8.1 0.046 0.420 0.046 0.420 0 -12: dbcsr_get_data_size_used 4864 5.6 0.039 0.419 0.039 0.419 11 -12: mp_isend_zv 3052 8.1 0.035 0.360 0.035 0.360 1 -12: tree_to_linear_c 432 6.0 0.024 0.278 0.024 0.278 0 -12: mp_irecv_dv 3284 8.1 0.021 0.193 0.021 0.193 4 -12: quick_finalize 1824 6.0 0.026 0.090 0.037 0.102 11 -12: mp_irecv_cv 2955 8.1 0.013 0.070 0.013 0.070 3 -12: dbcsr_verify_matrix 2432 4.2 0.012 0.061 0.012 0.061 2 -12: dbcsr_iterator_stop 10736 5.5 0.021 0.034 0.026 0.038 2 -12: dbcsr_distribution_new 5664 4.5 0.015 0.018 0.015 0.018 8 -12: transpose_index_local 800 6.0 0.004 0.014 0.007 0.017 8 -12: dbcsr_conjg 400 5.0 0.007 0.011 0.010 0.014 10 -12: mp_irecv_iv 13164 8.0 0.011 0.014 0.011 0.014 10 -12: dbcsr_iterator_seek 10736 6.5 0.009 0.012 0.009 0.012 0 -12: dbcsr_switch_data_area 4556 6.1 0.008 0.008 0.011 0.011 3 -12: dbcsr_mm_sched_finalize 608 10.0 0.001 0.008 0.001 0.008 7 -12: dbcsr_make_dbcsr_index 9952 7.7 0.006 0.007 0.006 0.007 0 -12: mp_max_l 107 1.0 0.005 0.007 0.005 0.007 8 -12: mp_irecv_rv 3293 8.1 0.006 0.006 0.006 0.006 8 -12: dbcsr_make_index_local_row 4256 6.0 0.006 0.006 0.006 0.006 6 -12: mp_irecv_zv 2957 8.1 0.004 0.006 0.004 0.006 4 -12: mp_isend_cv 3067 8.1 0.005 0.005 0.005 0.005 10 -12: dbcsr_init_lib_low 1 1.0 0.002 0.005 0.002 0.005 11 -12: dbcsr_get_global_col_map 608 5.0 0.001 0.003 0.001 0.003 5 -12: fill_hash_tables 608 8.0 0.002 0.002 0.002 0.002 10 -12: mp_maxloc_dv 237 1.0 0.002 0.002 0.002 0.002 11 -12: dbcsr_mm_sched_init 608 8.0 0.001 0.001 0.002 0.002 6 -12: dbcsr_get_local_cols 608 5.0 0.002 0.002 0.002 0.002 5 -12: mp_cart_sub 2 5.0 0.002 0.002 0.002 0.002 0 -12: mp_comm_free 4 2.0 0.002 0.002 0.002 0.002 7 -12: mp_sum_d 239 1.0 0.001 0.001 0.001 0.001 4 -12: mp_bcast_av 116 1.0 0.000 0.001 0.001 0.001 6 -12: dbcsr_get_global_row_map 608 5.0 0.001 0.001 0.001 0.001 0 -12: mp_bcast_i 117 2.0 0.001 0.001 0.001 0.001 4 -12: mp_cart_create 1 5.0 0.001 0.001 0.001 0.001 9 -12: mp_max_i 112 1.0 0.001 0.001 0.001 0.001 4 -12: dbcsr_mm_hostdrv_init 608 9.0 0.000 0.000 0.000 0.000 6 -12: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 7 -12: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 4 -12: mp_sum_lv 4 1.0 0.000 0.000 0.000 0.000 0 -12: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 8 +12: dbcsr_unittest 1 1.0 0.000 0.000 501.951 501.957 2 +12: dbcsr_test_multiplies 4 2.0 1.141 1.378 501.951 501.957 0 +12: test_multiply 608 3.0 0.056 0.061 494.288 496.500 1 +12: dbcsr_check_multiply 608 4.0 264.639 282.233 329.460 368.354 5 +12: dbcsr_redistribute 1824 4.0 2.669 3.290 91.881 143.145 6 +12: mp_alltoall_i22 1824 5.0 86.895 139.456 86.895 139.456 0 +12: mp_bcast_b 608 5.0 64.821 89.237 64.821 89.237 3 +12: dbcsr_multiply_generic 608 4.0 0.094 0.109 45.393 47.504 0 +12: multiply_cannon 608 5.0 1.422 2.056 26.184 27.514 0 +12: multiply_cannon_loop 608 6.0 0.553 1.333 20.053 22.701 2 +12: mp_waitall_1 29184 8.2 15.030 16.709 15.030 16.709 1 +12: make_m2s 1216 5.0 0.049 0.049 15.607 16.420 5 +12: mp_sum_l 4649 4.4 12.724 16.385 12.724 16.385 1 +12: make_images 1216 6.0 2.094 2.398 15.309 16.155 4 +12: multiply_cannon_metrocomm1 4256 7.0 0.049 0.057 11.253 13.957 3 +12: dbcsr_make_random_matrix 1824 3.0 1.376 8.832 2.383 13.127 0 +12: dbcsr_replicate 608 4.0 0.071 0.075 12.169 12.510 2 +12: multiply_cannon_multrec 4256 7.0 7.946 11.410 8.161 11.445 4 +12: make_images_sizes 1216 7.0 0.006 0.006 7.593 8.381 0 +12: mp_alltoall_i44 1216 8.0 7.588 8.376 7.588 8.376 5 +12: dbcsr_to_dense_local 2432 3.2 5.677 6.867 5.719 6.911 0 +12: dbcsr_finalize 4864 4.6 0.089 0.102 3.517 6.765 5 +12: dbcsr_merge_all 3040 5.4 1.471 2.545 3.293 6.466 0 +12: dbcsr_create_new 16032 6.1 4.063 5.605 4.404 5.999 1 +12: mp_allgather_i34 608 6.0 4.219 5.899 4.219 5.899 1 +12: make_images_data 1216 7.0 0.052 0.056 4.012 4.955 2 +12: mp_allgather_i12 608 5.0 3.918 4.173 3.918 4.173 5 +12: hybrid_alltoall_any 1216 8.0 0.107 0.150 3.046 3.968 2 +12: dbcsr_sort_data 4864 8.8 1.455 1.544 1.455 1.544 6 +12: mp_allgatherv_zv 144 5.0 1.412 1.508 1.412 1.508 1 +12: dbcsr_data_release 74252 6.2 1.121 1.425 1.121 1.425 0 +12: dbcsr_new_transposed 800 5.0 0.069 0.090 1.198 1.357 4 +12: mp_allgatherv_iv 608 5.0 1.277 1.349 1.277 1.349 5 +12: dbcsr_special_finalize 4864 7.0 0.078 0.086 1.015 1.189 6 +12: mp_allgatherv_dv 160 5.0 0.875 0.962 0.875 0.962 1 +12: dbcsr_merge_single_wm 4256 8.0 0.593 0.737 0.697 0.892 5 +12: dbcsr_data_copy_aa2 1976 6.5 0.146 0.851 0.146 0.851 0 +12: mp_alltoall_z11v 1296 5.0 0.618 0.809 0.618 0.809 2 +12: mp_allgatherv_cv 144 5.0 0.724 0.793 0.724 0.793 1 +12: mp_alltoall_i11v 5472 5.0 0.442 0.728 0.442 0.728 5 +12: tree_to_linear_z 432 6.0 0.098 0.678 0.098 0.678 0 +12: dbcsr_copy 1248 4.9 0.021 0.033 0.479 0.620 0 +12: mp_alltoall_d11v 1440 5.0 0.403 0.509 0.403 0.509 6 +12: dbcsr_destroy 16000 5.0 0.085 0.095 0.344 0.475 1 +12: mp_alltoall_c11v 1296 5.0 0.370 0.466 0.370 0.466 4 +12: mp_allgatherv_rv 160 5.0 0.427 0.456 0.427 0.456 4 +12: mp_sum_b 320 5.0 0.370 0.422 0.370 0.422 3 +12: multiply_cannon_multrec_finali 608 8.0 0.003 0.003 0.215 0.414 3 +12: dbcsr_mm_multrec_finalize 608 9.0 0.211 0.410 0.212 0.411 0 +12: mp_alltoall_r11v 1440 5.0 0.291 0.358 0.291 0.358 5 +12: tree_to_linear_d 480 6.0 0.052 0.353 0.052 0.353 0 +12: quick_finalize 2432 6.5 0.235 0.331 0.259 0.351 1 +12: dbcsr_make_index_exist 16032 7.1 0.290 0.342 0.290 0.342 1 +12: tree_to_linear_c 432 6.0 0.048 0.330 0.048 0.330 0 +12: setup_buffer_matrices 1216 6.0 0.027 0.028 0.227 0.254 3 +12: make_images_pack 1216 7.0 0.103 0.219 0.118 0.234 2 +12: dbcsr_data_new 50448 6.0 0.211 0.219 0.211 0.219 0 +12: tree_to_linear_s 480 6.0 0.030 0.199 0.030 0.199 0 +12: dbcsr_make_index_local_row 4864 6.0 0.148 0.197 0.148 0.197 4 +12: dbcsr_work_destroy_all 9728 6.8 0.054 0.063 0.107 0.172 2 +12: setup_rec_index_2d 1216 6.0 0.079 0.144 0.079 0.144 2 +12: dbcsr_work_create 9728 5.8 0.063 0.066 0.117 0.121 2 +12: dbcsr_mm_multrec_init 608 6.0 0.004 0.005 0.077 0.114 2 +12: dbcsr_make_index_list 4864 6.0 0.102 0.111 0.102 0.111 3 +12: dbcsr_mm_csr_init 608 7.0 0.068 0.105 0.073 0.110 0 +12: buffer_matrices_ensure_size 1216 6.0 0.066 0.096 0.066 0.096 3 +12: multiply_cannon_metrocomm2 3648 7.0 0.045 0.049 0.082 0.087 2 +12: dbcsr_iterator_start 10736 5.5 0.060 0.066 0.077 0.084 5 +12: dbcsr_sort_indices 8331 7.4 0.052 0.060 0.052 0.060 5 +12: dbcsr_make_untransposed_blocks 608 5.0 0.034 0.049 0.044 0.059 6 +12: merge_index 3040 6.4 0.036 0.058 0.036 0.058 0 +12: dbcsr_iterator_stop 10736 5.5 0.041 0.042 0.053 0.055 0 +12: dbcsr_switch_data_area 5164 6.5 0.018 0.019 0.024 0.026 0 +12: dbcsr_distribution_new 5664 4.5 0.020 0.022 0.020 0.022 0 +12: dbcsr_conjg 400 5.0 0.013 0.016 0.018 0.021 5 +12: mp_isend_iv 7714 8.0 0.016 0.019 0.016 0.019 4 +12: dbcsr_iterator_seek 10736 6.5 0.017 0.019 0.017 0.019 0 +12: dbcsr_verify_matrix 2432 4.2 0.011 0.016 0.011 0.016 0 +12: dbcsr_make_dbcsr_index 10560 7.7 0.014 0.015 0.014 0.015 0 +12: transpose_index_local 800 6.0 0.006 0.010 0.010 0.014 5 +12: mp_irecv_iv 7655 8.0 0.011 0.012 0.011 0.012 2 +12: mp_isend_rv 1577 8.3 0.009 0.012 0.009 0.012 4 +12: mp_isend_cv 1419 8.3 0.006 0.011 0.006 0.011 1 +12: mp_max_l 106 1.0 0.007 0.009 0.007 0.009 2 +12: dbcsr_get_data_size_used 4864 5.6 0.008 0.009 0.008 0.009 0 +12: mp_isend_zv 1427 8.3 0.006 0.007 0.006 0.007 5 +12: dbcsr_init_lib_low 1 1.0 0.004 0.006 0.004 0.006 3 +12: mp_sum_d 237 1.0 0.006 0.006 0.006 0.006 5 +12: mp_maxloc_dv 235 1.0 0.003 0.006 0.003 0.006 0 +12: mp_isend_dv 1582 8.3 0.005 0.006 0.005 0.006 5 +12: mp_max_i 111 1.0 0.005 0.006 0.005 0.006 2 +12: multiply_cannon_metrocomm3 4256 7.0 0.004 0.005 0.004 0.005 0 +12: dbcsr_get_local_rows 608 5.0 0.004 0.004 0.004 0.004 0 +12: dbcsr_mm_sched_init 608 8.0 0.003 0.003 0.004 0.004 5 +12: mp_irecv_dv 1574 8.3 0.003 0.004 0.003 0.004 4 +12: mp_irecv_zv 1414 8.3 0.003 0.004 0.003 0.004 3 +12: mp_irecv_rv 1559 8.3 0.003 0.003 0.003 0.003 4 +12: mp_irecv_cv 1410 8.3 0.003 0.003 0.003 0.003 5 +12: mp_bcast_av 115 1.0 0.001 0.001 0.002 0.003 3 +12: fill_hash_tables 608 8.0 0.002 0.002 0.002 0.002 5 +12: dbcsr_get_local_cols 608 5.0 0.002 0.002 0.002 0.002 0 +12: mp_bcast_i 116 2.0 0.001 0.002 0.001 0.002 5 +12: dbcsr_get_global_row_map 608 5.0 0.001 0.002 0.001 0.002 6 +12: dbcsr_mm_sched_finalize 608 10.0 0.001 0.001 0.001 0.001 0 +12: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 4 +12: dbcsr_get_global_col_map 608 5.0 0.001 0.001 0.001 0.001 6 +12: dbcsr_mm_hostdrv_init 608 9.0 0.001 0.001 0.001 0.001 5 +12: mp_cart_create 1 5.0 0.001 0.001 0.001 0.001 4 +12: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 5 +12: mp_sum_lv 4 1.0 0.000 0.000 0.000 0.000 1 +12: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 5 12: mp_bcast_iv 4 1.0 0.000 0.000 0.000 0.000 5 -12: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 4 -12: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 9 -12: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 4 -12: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 0 -12: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 6 +12: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 6 +12: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 0 +12: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 0 +12: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 5 +12: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 5 +12: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 2 +12: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 6 12: ------------------------------------------------------------------------------- 12: -12/19 Test #12: dbcsr_unittest2 ....................................... Passed 626.14 sec +12/19 Test #12: dbcsr_unittest2 ....................................... Passed 502.18 sec test 13 Start 13: dbcsr_unittest3 -13: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_unittest3" +13: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_unittest3" 13: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 13: Environment variables: 13: OMP_NUM_THREADS=2 13: Test timeout computed to be: 1500 13: test_name blocks_1_3_4 13: numthreads 2 -13: numnodes 12 +13: numnodes 7 13: matrix_sizes 496 48 48 13: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 13: alpha (1.0000000000000000,0.0000000000000000) @@ -49112,7 +49125,7 @@ 13: ********************************************************************** 13: test_name blocks_4_5_7 13: numthreads 2 -13: numnodes 12 +13: numnodes 7 13: matrix_sizes 496 48 48 13: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 13: alpha (1.0000000000000000,0.0000000000000000) @@ -49664,7 +49677,7 @@ 13: ********************************************************************** 13: test_name blocks_5_8_9 13: numthreads 2 -13: numnodes 12 +13: numnodes 7 13: matrix_sizes 506 44 44 13: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 13: alpha (1.0000000000000000,0.0000000000000000) @@ -50216,7 +50229,7 @@ 13: ********************************************************************** 13: test_name blocks_4_13_25 13: numthreads 2 -13: numnodes 12 +13: numnodes 7 13: matrix_sizes 504 42 42 13: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 13: alpha (1.0000000000000000,0.0000000000000000) @@ -50768,7 +50781,7 @@ 13: ********************************************************************** 13: test_name blocks_14_29_32 13: numthreads 2 -13: numnodes 12 +13: numnodes 7 13: matrix_sizes 525 75 75 13: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 13: alpha (1.0000000000000000,0.0000000000000000) @@ -51320,7 +51333,7 @@ 13: ********************************************************************** 13: test_name blocks_H2O 13: numthreads 2 -13: numnodes 12 +13: numnodes 7 13: matrix_sizes 552 46 46 13: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 13: alpha (1.0000000000000000,0.0000000000000000) @@ -51872,7 +51885,7 @@ 13: ********************************************************************** 13: test_name blocks_45_67_78 13: numthreads 2 -13: numnodes 12 +13: numnodes 7 13: matrix_sizes 570 190 190 13: sparsities 0.50000000000000000 0.50000000000000000 0.50000000000000000 13: alpha (1.0000000000000000,0.0000000000000000) @@ -52591,35 +52604,35 @@ 13: flops 78 x 78 x 78 83521152 100.0% 0.0% 0.0% 13: flops inhomo. stacks 0 0.0% 0.0% 0.0% 13: flops total 1.621150E+09 100.0% 0.0% 0.0% -13: flops max/rank 208.224268E+06 100.0% 0.0% 0.0% +13: flops max/rank 375.607274E+06 100.0% 0.0% 0.0% 13: matmuls inhomo. stacks 0 0.0% 0.0% 0.0% 13: matmuls total 1917619 100.0% 0.0% 0.0% -13: number of processed stacks 195163 100.0% 0.0% 0.0% -13: average stack size 9.8 0.0 0.0 -13: marketing flops 6.232116E+09 +13: number of processed stacks 369949 100.0% 0.0% 0.0% +13: average stack size 5.2 0.0 0.0 +13: marketing flops 6.232123E+09 13: ------------------------------------------------------------------------------- 13: # multiplications 756 -13: max memory usage/rank 113.934336E+06 -13: # max total images/rank 4 +13: max memory usage/rank 86.278144E+06 +13: # max total images/rank 7 13: # max 3D layers 1 -13: # MPI messages exchanged 154224 +13: # MPI messages exchanged 31752 13: MPI messages size (bytes): -13: total size 336.624384E+06 +13: total size 155.148384E+06 13: min size 0.000000E+00 13: max size 237.120000E+03 -13: average size 2.182698E+03 +13: average size 4.886255E+03 13: MPI breakdown and total messages size (bytes): -13: size <= 128 99291 431188 -13: 128 < size <= 8192 46409 91322732 -13: 8192 < size <= 32768 6150 99577232 -13: 32768 < size <= 131072 2252 126029712 -13: 131072 < size <= 4194304 122 19263520 +13: size <= 128 13080 11904 +13: 128 < size <= 8192 15804 29314944 +13: 8192 < size <= 32768 1530 23782680 +13: 32768 < size <= 131072 1134 68073960 +13: 131072 < size <= 4194304 204 33964896 13: 4194304 < size <= 16777216 0 0 13: 16777216 < size 0 0 13: ------------------------------------------------------------------------------- 13: 13: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -13: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +13: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 13: 13: ------------------------------------------------------------------------------- 13: - - @@ -52629,9 +52642,9 @@ 13: ROUTINE CALLS AVE VOLUME [Bytes] 13: MP_Bcast 917 5. 13: MP_Allreduce 6135 9. -13: MP_Alltoall 17388 19625. -13: MP_ISend 30812 1284. -13: MP_IRecv 33008 1157. +13: MP_Alltoall 17388 20090. +13: MP_ISend 13354 2016. +13: MP_IRecv 16710 2195. 13: ------------------------------------------------------------------------------- 13: 13: ------------------------------------------------------------------------------- @@ -52641,140 +52654,139 @@ 13: ------------------------------------------------------------------------------- 13: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 13: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -13: dbcsr_unittest 1 1.0 0.001 0.003 215.498 215.527 2 -13: dbcsr_test_multiplies 7 2.0 3.487 4.168 215.497 215.527 4 -13: test_multiply 756 3.0 0.067 0.413 200.457 202.777 3 -13: dbcsr_multiply_generic 756 4.0 0.483 0.753 107.359 110.626 10 -13: multiply_cannon 756 5.0 2.707 3.042 49.374 52.489 8 -13: make_m2s 1512 5.0 0.147 0.575 44.131 47.203 10 -13: make_images 1512 6.0 4.946 5.607 40.797 42.638 6 -13: dbcsr_redistribute 2268 4.0 4.520 5.904 39.506 42.532 11 -13: mp_alltoall_i22 2268 5.0 33.974 36.915 33.974 36.915 3 -13: mp_sum_l 5869 4.4 29.038 30.973 29.038 30.973 8 -13: multiply_cannon_loop 756 6.0 4.163 5.112 24.282 26.470 1 -13: dbcsr_create_new 18396 6.0 15.289 16.232 23.434 24.576 10 -13: make_images_sizes 1512 7.0 0.366 0.829 18.423 19.582 1 -13: mp_alltoall_i44 1512 8.0 18.056 19.218 18.056 19.218 3 -13: mp_waitall_1 33264 8.3 14.419 17.431 14.419 17.431 6 -13: mp_allgather_i34 756 6.0 14.704 17.296 14.704 17.296 5 -13: dbcsr_check_multiply 756 4.0 10.384 11.077 13.695 15.366 1 -13: dbcsr_make_random_matrix 2268 3.0 0.447 3.076 10.527 14.377 0 -13: dbcsr_finalize 6048 4.6 1.390 2.140 11.326 14.312 9 -13: dbcsr_merge_all 3780 5.4 8.327 10.362 9.692 13.186 7 -13: dbcsr_replicate 756 4.0 0.066 0.067 10.037 10.300 10 -13: dbcsr_special_finalize 5292 7.0 3.394 4.540 9.020 10.292 9 -13: multiply_cannon_multrec 9072 7.0 7.915 9.371 8.341 9.750 7 -13: dbcsr_make_index_exist 18396 7.0 8.115 8.835 8.115 8.835 8 -13: multiply_cannon_metrocomm1 9072 7.0 0.059 0.496 6.926 8.174 5 -13: dbcsr_merge_single_wm 5292 8.0 5.036 5.914 5.520 6.236 2 -13: setup_buffer_matrices 1512 6.0 0.035 0.214 4.849 5.686 5 -13: multiply_cannon_metrocomm3 9072 7.0 0.013 0.014 4.321 5.226 5 -13: mp_bcast_b 756 5.0 3.311 5.205 3.311 5.205 7 -13: make_images_data 1512 7.0 0.033 0.037 3.652 5.103 10 -13: dbcsr_make_index_list 5292 6.0 3.179 4.767 3.179 4.767 11 -13: mp_allgather_i12 756 5.0 3.458 3.668 3.458 3.668 8 -13: hybrid_alltoall_any 1512 8.0 0.258 0.831 2.527 3.580 8 -13: dbcsr_new_transposed 1008 5.0 0.023 0.037 3.023 3.370 3 -13: setup_rec_index_2d 1512 6.0 2.219 2.968 2.219 2.968 9 -13: dbcsr_copy 1512 5.0 0.079 0.415 2.076 2.895 1 -13: dbcsr_to_dense_local 3024 3.2 1.543 2.595 1.564 2.617 0 -13: merge_index 3780 6.4 0.797 1.968 0.797 1.968 0 -13: multiply_cannon_multrec_finali 756 8.0 0.002 0.002 0.426 1.432 10 -13: dbcsr_mm_multrec_finalize 756 9.0 0.424 1.429 0.424 1.430 11 -13: dbcsr_sort_data 6048 8.8 0.688 1.310 0.688 1.310 3 -13: dbcsr_data_release 88620 6.1 0.441 1.260 0.441 1.260 7 -13: multiply_cannon_metrocomm2 6804 7.0 0.141 0.560 0.251 1.085 10 -13: mp_sum_b 504 5.0 0.779 1.085 0.779 1.085 6 -13: mp_allgatherv_dv 189 5.0 0.816 1.032 0.816 1.032 1 -13: dbcsr_work_destroy_all 11340 6.7 0.114 0.548 0.251 0.981 6 -13: dbcsr_make_untransposed_blocks 756 5.0 0.338 0.974 0.344 0.980 11 -13: mp_allgatherv_iv 756 5.0 0.881 0.948 0.881 0.948 8 -13: multiply_cannon_metrocomm4 6048 7.0 0.032 0.039 0.280 0.839 10 -13: mp_allgatherv_rv 189 5.0 0.791 0.824 0.791 0.824 9 -13: mp_isend_zv 4092 8.2 0.097 0.786 0.097 0.786 8 -13: dbcsr_work_create 11340 5.7 0.131 0.650 0.185 0.671 1 -13: buffer_matrices_ensure_size 1512 6.0 0.391 0.655 0.391 0.655 3 -13: dbcsr_data_new 60480 5.9 0.197 0.614 0.197 0.614 4 -13: dbcsr_destroy 18396 4.9 0.132 0.574 0.262 0.614 10 -13: tree_to_linear_c 567 6.0 0.050 0.584 0.050 0.584 0 -13: mp_isend_rv 4095 8.2 0.054 0.583 0.054 0.583 4 -13: mp_irecv_cv 4182 8.2 0.151 0.580 0.151 0.580 10 -13: dbcsr_sort_indices 8370 7.3 0.243 0.548 0.243 0.548 0 -13: dbcsr_distribution_new 7056 4.5 0.060 0.529 0.060 0.529 2 -13: mp_irecv_rv 4162 8.2 0.047 0.512 0.047 0.512 11 -13: mp_isend_cv 4087 8.2 0.049 0.495 0.049 0.495 3 -13: dbcsr_get_local_cols 756 5.0 0.036 0.408 0.036 0.408 2 -13: mp_allgatherv_zv 189 5.0 0.337 0.400 0.337 0.400 4 -13: dbcsr_iterator_stop 13356 5.5 0.053 0.392 0.058 0.397 5 -13: mp_allgatherv_cv 189 5.0 0.335 0.385 0.335 0.385 1 -13: mp_alltoall_d11v 1701 5.0 0.219 0.347 0.219 0.347 7 -13: dbcsr_mm_multrec_init 756 6.0 0.002 0.005 0.118 0.345 8 -13: dbcsr_mm_csr_init 756 7.0 0.107 0.336 0.115 0.343 0 -13: mp_irecv_zv 4165 8.2 0.031 0.322 0.031 0.322 1 -13: mp_alltoall_z11v 1701 5.0 0.185 0.273 0.185 0.273 11 -13: mp_alltoall_c11v 1701 5.0 0.153 0.270 0.153 0.270 11 -13: dbcsr_data_copy_aa2 2800 6.8 0.019 0.193 0.019 0.193 0 -13: mp_alltoall_r11v 1701 5.0 0.132 0.192 0.132 0.192 3 -13: tree_to_linear_z 567 6.0 0.017 0.190 0.017 0.190 0 -13: quick_finalize 2268 6.0 0.077 0.169 0.092 0.185 11 -13: make_images_pack 1512 7.0 0.028 0.150 0.037 0.159 5 -13: mp_alltoall_i11v 6804 5.0 0.065 0.124 0.065 0.124 6 -13: tree_to_linear_s 567 6.0 0.025 0.111 0.025 0.111 0 -13: tree_to_linear_d 567 6.0 0.010 0.108 0.010 0.108 0 -13: mp_max_l 107 1.0 0.029 0.077 0.029 0.077 8 -13: dbcsr_iterator_start 13356 5.5 0.037 0.044 0.047 0.054 5 -13: dbcsr_verify_matrix 3024 4.2 0.018 0.030 0.018 0.030 0 -13: mp_isend_iv 17657 8.0 0.022 0.023 0.022 0.023 11 -13: mp_irecv_iv 17485 8.0 0.013 0.015 0.013 0.015 7 -13: dbcsr_switch_data_area 5712 6.1 0.009 0.009 0.012 0.013 5 -13: dbcsr_make_dbcsr_index 12348 7.7 0.010 0.013 0.010 0.013 0 -13: dbcsr_conjg 504 5.0 0.006 0.009 0.010 0.013 10 -13: dbcsr_get_data_size_used 6048 5.6 0.007 0.012 0.007 0.012 11 -13: dbcsr_iterator_seek 13356 6.5 0.010 0.012 0.010 0.012 0 -13: mp_isend_dv 4116 8.2 0.007 0.009 0.007 0.009 7 -13: transpose_index_local 1008 6.0 0.004 0.004 0.008 0.009 11 -13: fill_hash_tables 756 8.0 0.006 0.008 0.006 0.008 10 -13: dbcsr_make_index_local_row 5292 6.0 0.008 0.008 0.008 0.008 3 -13: mp_irecv_dv 4172 8.2 0.004 0.005 0.004 0.005 3 -13: dbcsr_get_local_rows 756 5.0 0.004 0.004 0.004 0.004 6 -13: mp_comm_free 4 2.0 0.001 0.003 0.001 0.003 0 -13: mp_sum_lv 161 1.0 0.002 0.002 0.002 0.002 11 -13: dbcsr_mm_sched_init 756 8.0 0.002 0.002 0.002 0.002 2 -13: mp_max_i 269 1.0 0.002 0.002 0.002 0.002 11 -13: mp_maxloc_dv 237 1.0 0.001 0.001 0.001 0.001 8 -13: dbcsr_init_lib_low 1 1.0 0.001 0.001 0.001 0.001 4 -13: mp_sum_d 239 1.0 0.001 0.001 0.001 0.001 11 -13: dbcsr_get_global_row_map 756 5.0 0.001 0.001 0.001 0.001 0 -13: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 0 -13: mp_bcast_av 116 1.0 0.000 0.000 0.001 0.001 1 +13: dbcsr_unittest 1 1.0 0.002 0.004 106.651 106.691 6 +13: dbcsr_test_multiplies 7 2.0 0.963 1.104 106.648 106.687 6 +13: test_multiply 756 3.0 0.059 0.068 103.201 104.060 6 +13: dbcsr_multiply_generic 756 4.0 0.117 0.135 40.504 40.882 5 +13: dbcsr_redistribute 2268 4.0 3.072 3.649 20.182 21.536 4 +13: make_m2s 1512 5.0 0.062 0.063 18.036 18.235 2 +13: multiply_cannon 756 5.0 1.505 1.761 17.760 18.115 4 +13: make_images 1512 6.0 2.048 2.394 17.789 18.023 4 +13: dbcsr_check_multiply 756 4.0 13.800 14.783 16.628 17.759 6 +13: mp_alltoall_i22 2268 5.0 15.931 17.374 15.931 17.374 1 +13: mp_sum_l 5869 4.4 13.997 15.011 13.997 15.011 0 +13: mp_waitall_1 36288 8.2 12.391 13.726 12.391 13.726 0 +13: dbcsr_replicate 756 4.0 0.125 0.134 11.882 12.174 1 +13: multiply_cannon_loop 756 6.0 0.291 0.405 10.987 11.194 4 +13: make_images_sizes 1512 7.0 0.007 0.007 9.437 9.936 5 +13: mp_alltoall_i44 1512 8.0 9.430 9.929 9.430 9.929 5 +13: multiply_cannon_metrocomm1 5292 7.0 0.060 0.063 7.994 8.630 2 +13: mp_allgather_i12 756 5.0 5.453 5.714 5.453 5.714 1 +13: dbcsr_make_random_matrix 2268 3.0 0.764 3.390 1.614 5.648 0 +13: make_images_data 1512 7.0 0.066 0.072 4.639 5.309 6 +13: dbcsr_create_new 19908 6.1 4.105 4.857 4.433 5.187 3 +13: mp_allgather_i34 756 6.0 4.708 5.030 4.708 5.030 5 +13: mp_bcast_b 756 5.0 2.828 4.637 2.828 4.637 5 +13: hybrid_alltoall_any 1512 8.0 0.079 0.088 3.559 4.203 5 +13: dbcsr_finalize 6048 4.6 0.103 0.119 2.286 3.446 6 +13: dbcsr_merge_all 3780 5.4 1.400 1.823 2.056 3.224 0 +13: multiply_cannon_multrec 5292 7.0 2.221 2.558 2.599 2.934 4 +13: mp_allgatherv_iv 756 5.0 2.365 2.579 2.365 2.579 6 +13: dbcsr_to_dense_local 3024 3.2 1.430 2.035 1.474 2.074 0 +13: dbcsr_special_finalize 6048 7.0 0.089 0.098 1.153 1.327 1 +13: dbcsr_new_transposed 1008 5.0 0.041 0.063 1.185 1.324 5 +13: dbcsr_merge_single_wm 5292 8.0 0.721 0.893 0.789 0.969 4 +13: mp_sum_b 504 5.0 0.689 0.789 0.689 0.789 3 +13: dbcsr_copy 1512 5.0 0.023 0.029 0.605 0.775 6 +13: mp_allgatherv_zv 189 5.0 0.470 0.498 0.470 0.498 0 +13: multiply_cannon_multrec_finali 756 8.0 0.004 0.004 0.378 0.488 4 +13: dbcsr_mm_multrec_finalize 756 9.0 0.373 0.483 0.374 0.484 5 +13: dbcsr_data_release 92400 6.2 0.321 0.387 0.321 0.387 0 +13: dbcsr_sort_data 6048 8.8 0.360 0.377 0.360 0.377 6 +13: quick_finalize 3024 6.5 0.267 0.339 0.301 0.375 2 +13: mp_allgatherv_dv 189 5.0 0.330 0.364 0.330 0.364 3 +13: mp_allgatherv_cv 189 5.0 0.328 0.361 0.328 0.361 5 +13: mp_alltoall_z11v 1701 5.0 0.253 0.319 0.253 0.319 5 +13: mp_alltoall_c11v 1701 5.0 0.222 0.313 0.222 0.313 6 +13: dbcsr_make_index_exist 19908 7.1 0.278 0.299 0.278 0.299 1 +13: dbcsr_data_copy_aa2 2951 6.7 0.046 0.290 0.046 0.290 0 +13: mp_alltoall_d11v 1701 5.0 0.209 0.276 0.209 0.276 5 +13: mp_alltoall_r11v 1701 5.0 0.204 0.270 0.204 0.270 5 +13: setup_buffer_matrices 1512 6.0 0.032 0.033 0.232 0.246 4 +13: mp_allgatherv_rv 189 5.0 0.223 0.246 0.223 0.246 3 +13: dbcsr_destroy 19908 5.0 0.109 0.116 0.181 0.198 4 +13: tree_to_linear_z 567 6.0 0.028 0.186 0.028 0.186 0 +13: dbcsr_sort_indices 10092 7.6 0.147 0.185 0.147 0.185 0 +13: dbcsr_data_new 62748 6.0 0.175 0.182 0.175 0.182 0 +13: setup_rec_index_2d 1512 6.0 0.103 0.156 0.103 0.156 4 +13: tree_to_linear_c 567 6.0 0.021 0.134 0.021 0.134 0 +13: dbcsr_make_index_list 6048 6.0 0.117 0.133 0.117 0.133 6 +13: mp_alltoall_i11v 6804 5.0 0.082 0.129 0.082 0.129 6 +13: buffer_matrices_ensure_size 1512 6.0 0.085 0.127 0.085 0.127 6 +13: dbcsr_work_create 12096 5.8 0.073 0.082 0.111 0.121 4 +13: dbcsr_mm_multrec_init 756 6.0 0.005 0.005 0.099 0.112 3 +13: dbcsr_mm_csr_init 756 7.0 0.086 0.099 0.094 0.108 2 +13: tree_to_linear_d 567 6.0 0.016 0.105 0.016 0.105 0 +13: multiply_cannon_metrocomm2 4536 7.0 0.055 0.062 0.097 0.104 4 +13: merge_index 3780 6.4 0.085 0.102 0.085 0.102 0 +13: dbcsr_make_index_local_row 6048 6.0 0.068 0.100 0.068 0.100 4 +13: dbcsr_iterator_start 13356 5.5 0.068 0.074 0.092 0.096 4 +13: dbcsr_work_destroy_all 12096 6.8 0.068 0.075 0.090 0.096 4 +13: tree_to_linear_s 567 6.0 0.016 0.092 0.016 0.092 0 +13: dbcsr_iterator_stop 13356 5.5 0.051 0.062 0.067 0.076 1 +13: make_images_pack 1512 7.0 0.037 0.050 0.056 0.069 5 +13: mp_max_l 106 1.0 0.040 0.066 0.040 0.066 0 +13: dbcsr_make_untransposed_blocks 756 5.0 0.030 0.034 0.041 0.046 4 +13: dbcsr_verify_matrix 3024 4.2 0.027 0.042 0.027 0.042 0 +13: dbcsr_distribution_new 7056 4.5 0.026 0.035 0.026 0.035 4 +13: dbcsr_switch_data_area 6468 6.5 0.023 0.026 0.031 0.034 6 +13: dbcsr_iterator_seek 13356 6.5 0.024 0.031 0.024 0.031 0 +13: dbcsr_make_dbcsr_index 13104 7.8 0.024 0.027 0.024 0.027 5 +13: dbcsr_conjg 504 5.0 0.012 0.019 0.019 0.026 5 +13: mp_isend_iv 10895 8.0 0.021 0.025 0.021 0.025 6 +13: dbcsr_get_data_size_used 6048 5.6 0.011 0.018 0.011 0.018 2 +13: transpose_index_local 1008 6.0 0.007 0.008 0.013 0.016 6 +13: mp_irecv_iv 9359 8.0 0.014 0.015 0.014 0.015 5 +13: mp_isend_zv 2172 8.4 0.009 0.013 0.009 0.013 6 +13: mp_isend_cv 2175 8.4 0.007 0.010 0.007 0.010 4 +13: mp_isend_dv 2181 8.4 0.008 0.010 0.008 0.010 5 +13: mp_isend_rv 2188 8.4 0.007 0.010 0.007 0.010 4 +13: multiply_cannon_metrocomm3 5292 7.0 0.006 0.010 0.006 0.010 3 +13: mp_irecv_rv 1959 8.4 0.004 0.006 0.004 0.006 2 +13: dbcsr_init_lib_low 1 1.0 0.003 0.006 0.003 0.006 1 +13: dbcsr_get_local_rows 756 5.0 0.006 0.006 0.006 0.006 0 +13: dbcsr_mm_sched_init 756 8.0 0.003 0.004 0.004 0.005 4 +13: fill_hash_tables 756 8.0 0.004 0.004 0.004 0.004 4 +13: mp_irecv_zv 1967 8.4 0.003 0.004 0.003 0.004 2 +13: mp_irecv_dv 1955 8.4 0.003 0.004 0.003 0.004 2 +13: mp_irecv_cv 1938 8.4 0.003 0.003 0.003 0.003 0 +13: mp_sum_lv 161 1.0 0.002 0.003 0.002 0.003 0 +13: mp_max_i 268 1.0 0.002 0.003 0.002 0.003 6 +13: mp_maxloc_dv 235 1.0 0.002 0.002 0.002 0.002 0 +13: dbcsr_get_local_cols 756 5.0 0.002 0.002 0.002 0.002 0 +13: mp_sum_d 237 1.0 0.002 0.002 0.002 0.002 0 +13: dbcsr_get_global_row_map 756 5.0 0.002 0.002 0.002 0.002 0 +13: mp_bcast_av 115 1.0 0.001 0.001 0.001 0.002 3 13: dbcsr_get_global_col_map 756 5.0 0.001 0.001 0.001 0.001 5 +13: mp_cart_sub 2 5.0 0.001 0.001 0.001 0.001 0 13: mp_max_r 1 1.0 0.001 0.001 0.001 0.001 2 -13: mp_cart_create 1 5.0 0.001 0.001 0.001 0.001 10 -13: dbcsr_mm_sched_finalize 756 10.0 0.001 0.001 0.001 0.001 3 -13: mp_bcast_i 117 2.0 0.000 0.001 0.000 0.001 6 -13: dbcsr_mm_hostdrv_init 756 9.0 0.000 0.000 0.000 0.000 3 -13: mp_bcast_iv 161 1.0 0.000 0.000 0.000 0.000 8 -13: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 4 -13: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 0 -13: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 2 -13: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 6 -13: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 9 -13: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 10 -13: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 11 +13: dbcsr_mm_sched_finalize 756 10.0 0.001 0.001 0.001 0.001 4 +13: dbcsr_mm_hostdrv_init 756 9.0 0.001 0.001 0.001 0.001 0 +13: mp_bcast_i 116 2.0 0.001 0.001 0.001 0.001 4 +13: mp_bcast_iv 161 1.0 0.001 0.001 0.001 0.001 4 +13: mp_cart_create 1 5.0 0.001 0.001 0.001 0.001 5 +13: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 0 +13: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 2 +13: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 6 +13: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 6 +13: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 2 +13: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 6 +13: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 2 +13: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 0 13: ------------------------------------------------------------------------------- 13: -13/19 Test #13: dbcsr_unittest3 ....................................... Passed 216.27 sec +13/19 Test #13: dbcsr_unittest3 ....................................... Passed 106.82 sec test 14 Start 14: dbcsr_unittest4 -14: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_unittest4" +14: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_unittest4" 14: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 14: Environment variables: 14: OMP_NUM_THREADS=2 14: Test timeout computed to be: 1500 14: test_name scale_by_vector_symmetric 14: numthreads 2 -14: numnodes 12 +14: numnodes 7 14: matrix_size 20 20 14: sparsity 0.50000000000000000 14: bs_m 1 4 @@ -52817,7 +52829,7 @@ 14: ********************************************************************** 14: test_name scale_by_vector_asymm_exact1 14: numthreads 2 -14: numnodes 12 +14: numnodes 7 14: matrix_size 30 20 14: sparsity 0.0000000000000000 14: bs_m 1 4 @@ -52836,7 +52848,7 @@ 14: ********************************************************************** 14: test_name scale_by_vector_asymm_exact2 14: numthreads 2 -14: numnodes 12 +14: numnodes 7 14: matrix_size 20 30 14: sparsity 0.0000000000000000 14: bs_m 1 4 @@ -52876,7 +52888,7 @@ 14: ROUTINE CALLS AVE VOLUME [Bytes] 14: MP_Bcast 1 12. 14: MP_Allreduce 43 14. -14: MP_Alltoall 140 844. +14: MP_Alltoall 140 623. 14: ------------------------------------------------------------------------------- 14: 14: ------------------------------------------------------------------------------- @@ -52886,75 +52898,75 @@ 14: ------------------------------------------------------------------------------- 14: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 14: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -14: dbcsr_unittest 1 1.0 0.001 0.006 1.364 1.378 7 -14: dbcsr_test_scale_by_vectors 3 2.0 0.078 0.106 1.363 1.378 7 -14: test_scale_by_vector 20 3.0 0.001 0.001 1.123 1.249 11 -14: dbcsr_redistribute 20 4.0 0.038 0.072 0.595 0.728 11 -14: mp_alltoall_i22 20 5.0 0.415 0.547 0.415 0.547 1 -14: dbcsr_checksum 24 4.0 0.098 0.145 0.435 0.493 11 -14: mp_sum_d 99 2.0 0.337 0.437 0.337 0.437 6 -14: dbcsr_make_random_matrix 40 3.0 0.001 0.006 0.161 0.284 0 -14: dbcsr_create_new 100 4.4 0.112 0.162 0.149 0.228 7 -14: dbcsr_finalize 60 4.3 0.014 0.026 0.102 0.182 7 -14: dbcsr_merge_all 40 5.0 0.080 0.144 0.087 0.155 7 -14: dbcsr_new_transposed 40 4.0 0.000 0.001 0.075 0.122 11 -14: mp_cart_sub 2 5.0 0.093 0.096 0.093 0.096 6 -14: dbcsr_make_index_exist 100 5.4 0.037 0.069 0.037 0.069 3 -14: mp_cart_create 1 5.0 0.043 0.048 0.043 0.048 9 -14: dbcsr_init_lib_low 1 1.0 0.012 0.033 0.012 0.033 10 -14: mp_alltoall_d11v 15 5.0 0.004 0.013 0.004 0.013 10 -14: merge_index 40 6.0 0.007 0.012 0.007 0.012 10 -14: mp_max_l 48 1.0 0.005 0.006 0.005 0.006 0 -14: dbcsr_to_dense_local 36 3.4 0.001 0.003 0.001 0.003 1 -14: transpose_index_local 40 5.0 0.000 0.002 0.000 0.002 0 -14: mp_alltoall_r11v 15 5.0 0.001 0.002 0.001 0.002 7 -14: mp_maxloc_dv 121 1.0 0.001 0.001 0.001 0.001 10 -14: mp_sum_l 99 1.0 0.001 0.001 0.001 0.001 3 -14: dbcsr_scale_by_vector_anytype 40 4.0 0.000 0.000 0.000 0.001 11 -14: mp_bcast_av 58 1.0 0.000 0.000 0.000 0.001 5 -14: dbcsr_destroy 100 3.6 0.000 0.000 0.000 0.000 11 -14: dbcsr_data_new 452 4.8 0.000 0.000 0.000 0.000 7 -14: dbcsr_data_release 588 5.1 0.000 0.000 0.000 0.000 11 -14: mp_bcast_i 59 2.0 0.000 0.000 0.000 0.000 2 -14: dbcsr_work_create 60 4.3 0.000 0.000 0.000 0.000 7 -14: dbcsr_iterator_start 116 4.8 0.000 0.000 0.000 0.000 11 -14: mp_max_i 51 1.0 0.000 0.000 0.000 0.000 0 -14: quick_finalize 20 6.0 0.000 0.000 0.000 0.000 11 -14: dbcsr_work_destroy_all 60 5.3 0.000 0.000 0.000 0.000 11 -14: dbcsr_iterator_stop 116 4.8 0.000 0.000 0.000 0.000 0 +14: dbcsr_unittest 1 1.0 0.001 0.001 0.224 0.229 3 +14: dbcsr_test_scale_by_vectors 3 2.0 0.012 0.025 0.223 0.228 0 +14: test_scale_by_vector 20 3.0 0.001 0.001 0.201 0.217 3 +14: dbcsr_redistribute 20 4.0 0.018 0.039 0.103 0.120 5 +14: mp_alltoall_i22 20 5.0 0.080 0.103 0.080 0.103 2 +14: dbcsr_checksum 24 4.0 0.011 0.027 0.082 0.094 0 +14: mp_sum_d 99 2.0 0.072 0.094 0.072 0.094 4 +14: dbcsr_init_lib_low 1 1.0 0.010 0.035 0.010 0.035 4 +14: dbcsr_create_new 100 4.4 0.013 0.030 0.014 0.031 1 +14: dbcsr_new_transposed 40 4.0 0.001 0.001 0.011 0.029 3 +14: dbcsr_make_random_matrix 40 3.0 0.002 0.003 0.009 0.011 0 +14: dbcsr_finalize 60 4.3 0.001 0.001 0.005 0.006 3 +14: mp_max_i 51 1.0 0.004 0.005 0.004 0.005 6 +14: dbcsr_merge_all 40 5.0 0.002 0.003 0.003 0.004 0 +14: mp_max_l 48 1.0 0.003 0.004 0.003 0.004 2 +14: dbcsr_to_dense_local 36 3.4 0.001 0.001 0.002 0.002 3 +14: mp_cart_sub 2 5.0 0.002 0.002 0.002 0.002 4 +14: mp_maxloc_dv 121 1.0 0.001 0.001 0.001 0.001 2 +14: dbcsr_scale_by_vector_anytype 40 4.0 0.001 0.001 0.001 0.001 3 +14: dbcsr_make_index_exist 100 5.4 0.001 0.001 0.001 0.001 1 +14: mp_bcast_av 58 1.0 0.000 0.001 0.001 0.001 3 +14: mp_sum_l 99 1.0 0.001 0.001 0.001 0.001 2 +14: dbcsr_data_release 588 5.1 0.001 0.001 0.001 0.001 3 +14: dbcsr_destroy 100 3.6 0.001 0.001 0.001 0.001 6 +14: dbcsr_data_new 452 4.8 0.001 0.001 0.001 0.001 3 +14: dbcsr_work_create 60 4.3 0.000 0.001 0.001 0.001 3 +14: dbcsr_iterator_start 116 4.8 0.000 0.001 0.001 0.001 3 +14: dbcsr_iterator_stop 116 4.8 0.000 0.000 0.001 0.001 4 +14: dbcsr_work_destroy_all 60 5.3 0.000 0.000 0.001 0.001 3 +14: quick_finalize 20 6.0 0.000 0.000 0.000 0.001 6 +14: mp_bcast_i 59 2.0 0.000 0.001 0.000 0.001 4 +14: transpose_index_local 40 5.0 0.000 0.000 0.000 0.000 6 +14: merge_index 40 6.0 0.000 0.000 0.000 0.000 0 +14: mp_alltoall_i11v 60 5.0 0.000 0.000 0.000 0.000 2 +14: tree_to_linear_c 10 6.0 0.000 0.000 0.000 0.000 0 14: tree_to_linear_z 10 6.0 0.000 0.000 0.000 0.000 0 14: tree_to_linear_d 10 6.0 0.000 0.000 0.000 0.000 0 14: tree_to_linear_s 10 6.0 0.000 0.000 0.000 0.000 0 -14: dbcsr_distribution_new 100 4.4 0.000 0.000 0.000 0.000 11 -14: tree_to_linear_c 10 6.0 0.000 0.000 0.000 0.000 0 -14: dbcsr_sort_indices 82 6.2 0.000 0.000 0.000 0.000 0 -14: mp_alltoall_z11v 15 5.0 0.000 0.000 0.000 0.000 4 -14: mp_alltoall_i11v 60 5.0 0.000 0.000 0.000 0.000 2 -14: mp_alltoall_c11v 15 5.0 0.000 0.000 0.000 0.000 4 -14: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 11 -14: dbcsr_iterator_seek 116 5.8 0.000 0.000 0.000 0.000 0 -14: dbcsr_verify_matrix 40 4.0 0.000 0.000 0.000 0.000 0 +14: dbcsr_distribution_new 100 4.4 0.000 0.000 0.000 0.000 3 +14: dbcsr_sort_indices 84 6.2 0.000 0.000 0.000 0.000 6 +14: mp_alltoall_z11v 15 5.0 0.000 0.000 0.000 0.000 2 +14: mp_alltoall_c11v 15 5.0 0.000 0.000 0.000 0.000 2 +14: mp_alltoall_r11v 15 5.0 0.000 0.000 0.000 0.000 2 +14: dbcsr_iterator_seek 116 5.8 0.000 0.000 0.000 0.000 6 +14: mp_alltoall_d11v 15 5.0 0.000 0.000 0.000 0.000 2 +14: dbcsr_make_dbcsr_index 100 6.2 0.000 0.000 0.000 0.000 3 +14: dbcsr_switch_data_area 20 7.0 0.000 0.000 0.000 0.000 0 +14: mp_cart_create 1 5.0 0.000 0.000 0.000 0.000 2 +14: dbcsr_get_data_size_used 60 5.3 0.000 0.000 0.000 0.000 6 14: dbcsr_data_copy_aa2 40 6.0 0.000 0.000 0.000 0.000 0 -14: dbcsr_switch_data_area 20 7.0 0.000 0.000 0.000 0.000 7 -14: dbcsr_get_data_size_used 60 5.3 0.000 0.000 0.000 0.000 11 -14: dbcsr_make_dbcsr_index 100 6.2 0.000 0.000 0.000 0.000 7 -14: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 8 -14: mp_bcast_iv 1 1.0 0.000 0.000 0.000 0.000 6 -14: mp_sum_lv 1 1.0 0.000 0.000 0.000 0.000 11 -14: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 0 -14: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 8 -14: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 3 -14: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 4 -14: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 11 -14: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 9 -14: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 3 +14: dbcsr_verify_matrix 40 4.0 0.000 0.000 0.000 0.000 3 +14: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 6 +14: mp_comm_free 4 2.0 0.000 0.000 0.000 0.000 1 +14: mp_sum_lv 1 1.0 0.000 0.000 0.000 0.000 0 +14: mp_bcast_iv 1 1.0 0.000 0.000 0.000 0.000 4 +14: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 2 +14: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 2 +14: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 6 +14: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 2 +14: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 2 +14: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 6 +14: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 2 14: ------------------------------------------------------------------------------- 14: -14/19 Test #14: dbcsr_unittest4 ....................................... Passed 1.81 sec +14/19 Test #14: dbcsr_unittest4 ....................................... Passed 0.37 sec test 15 Start 15: dbcsr_tensor_unittest -15: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_tensor_unittest" +15: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_tensor_unittest" 15: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 15: Environment variables: 15: OMP_NUM_THREADS=2 @@ -52984,20 +52996,20 @@ 15: 15: Test 1: ( 1 | 2 ) 15: Reference distribution: -15: Dist vec 1: 2 2 0 1 0 0 2 0 3 3 3 0 2 3 -15: Dist vec 2: 2 1 0 2 2 2 2 1 0 1 1 0 2 1 0 2 0 2 0 0 1 +15: Dist vec 1: 0 4 0 2 5 6 6 3 6 1 4 0 5 3 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 15: Test distribution: -15: Dist vec 1: 2 2 0 1 0 0 2 0 3 3 3 0 2 3 -15: Dist vec 2: 2 1 0 2 2 2 2 1 0 1 1 0 2 1 0 2 0 2 0 0 1 +15: Dist vec 1: 0 4 0 2 5 6 6 3 6 1 4 0 5 3 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 15: Test 1 Test passed! 15: 15: Test 2: ( 2 | 1 ) 15: Reference distribution: -15: Dist vec 1: 2 2 0 1 0 0 2 0 3 3 3 0 2 3 -15: Dist vec 2: 2 1 0 2 2 2 2 1 0 1 1 0 2 1 0 2 0 2 0 0 1 +15: Dist vec 1: 0 4 0 2 5 6 6 3 6 1 4 0 5 3 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 15: Test distribution: -15: Dist vec 1: 2 2 0 1 0 0 2 0 3 3 3 0 2 3 -15: Dist vec 2: 2 1 0 2 2 2 2 1 0 1 1 0 2 1 0 2 0 2 0 0 1 +15: Dist vec 1: 0 4 0 2 5 6 6 3 6 1 4 0 5 3 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 15: Test 2 Test passed! 15: 15: -------------------------------------------------------------------------------- @@ -53019,134 +53031,134 @@ 15: 15: Test 1: ( 1 | 2 3 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 1 Test passed! 15: 15: Test 2: ( 1 2 | 3 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 2 Test passed! 15: 15: Test 3: ( 1 | 3 2 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 3 Test passed! 15: 15: Test 4: ( 1 3 | 2 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 4 Test passed! 15: 15: Test 5: ( 2 | 1 3 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 5 Test passed! 15: 15: Test 6: ( 2 1 | 3 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 6 Test passed! 15: 15: Test 7: ( 2 | 3 1 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 7 Test passed! 15: 15: Test 8: ( 2 3 | 1 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 8 Test passed! 15: 15: Test 9: ( 3 | 2 1 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 9 Test passed! 15: 15: Test 10: ( 3 2 | 1 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 10 Test passed! 15: 15: Test 11: ( 3 | 1 2 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 11 Test passed! 15: 15: Test 12: ( 3 1 | 2 ) 15: Reference distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 -15: Test distribution: -15: Dist vec 1: 2 0 1 0 -15: Dist vec 2: 1 0 0 1 0 1 -15: Dist vec 3: 0 0 1 +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 +15: Test distribution: +15: Dist vec 1: 5 3 4 2 +15: Dist vec 2: 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 15: Test 12 Test passed! 15: 15: -------------------------------------------------------------------------------- @@ -53182,937 +53194,937 @@ 15: 15: Test 1: ( 1 | 2 3 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 1 Test passed! 15: 15: Test 2: ( 1 2 | 3 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 2 Test passed! 15: 15: Test 3: ( 1 2 3 | 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 3 Test passed! 15: 15: Test 4: ( 1 | 2 4 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 4 Test passed! 15: 15: Test 5: ( 1 2 | 4 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 5 Test passed! 15: 15: Test 6: ( 1 2 4 | 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 6 Test passed! 15: 15: Test 7: ( 1 | 3 2 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 7 Test passed! 15: 15: Test 8: ( 1 3 | 2 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 8 Test passed! 15: 15: Test 9: ( 1 3 2 | 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 9 Test passed! 15: 15: Test 10: ( 1 | 3 4 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 10 Test passed! 15: 15: Test 11: ( 1 3 | 4 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 11 Test passed! 15: 15: Test 12: ( 1 3 4 | 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 12 Test passed! 15: 15: Test 13: ( 1 | 4 3 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 13 Test passed! 15: 15: Test 14: ( 1 4 | 3 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 14 Test passed! 15: 15: Test 15: ( 1 4 3 | 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 15 Test passed! 15: 15: Test 16: ( 1 | 4 2 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 16 Test passed! 15: 15: Test 17: ( 1 4 | 2 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 17 Test passed! 15: 15: Test 18: ( 1 4 2 | 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 18 Test passed! 15: 15: Test 19: ( 2 | 1 3 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 19 Test passed! 15: 15: Test 20: ( 2 1 | 3 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 20 Test passed! 15: 15: Test 21: ( 2 1 3 | 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 21 Test passed! 15: 15: Test 22: ( 2 | 1 4 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 22 Test passed! 15: 15: Test 23: ( 2 1 | 4 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 23 Test passed! 15: 15: Test 24: ( 2 1 4 | 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 24 Test passed! 15: 15: Test 25: ( 2 | 3 1 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 25 Test passed! 15: 15: Test 26: ( 2 3 | 1 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 26 Test passed! 15: 15: Test 27: ( 2 3 1 | 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 27 Test passed! 15: 15: Test 28: ( 2 | 3 4 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 28 Test passed! 15: 15: Test 29: ( 2 3 | 4 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 29 Test passed! 15: 15: Test 30: ( 2 3 4 | 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 30 Test passed! 15: 15: Test 31: ( 2 | 4 3 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 31 Test passed! 15: 15: Test 32: ( 2 4 | 3 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 32 Test passed! 15: 15: Test 33: ( 2 4 3 | 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 33 Test passed! 15: 15: Test 34: ( 2 | 4 1 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 34 Test passed! 15: 15: Test 35: ( 2 4 | 1 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 35 Test passed! 15: 15: Test 36: ( 2 4 1 | 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 36 Test passed! 15: 15: Test 37: ( 3 | 2 1 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 37 Test passed! 15: 15: Test 38: ( 3 2 | 1 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 38 Test passed! 15: 15: Test 39: ( 3 2 1 | 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 39 Test passed! 15: 15: Test 40: ( 3 | 2 4 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 40 Test passed! 15: 15: Test 41: ( 3 2 | 4 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 41 Test passed! 15: 15: Test 42: ( 3 2 4 | 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 42 Test passed! 15: 15: Test 43: ( 3 | 1 2 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 43 Test passed! 15: 15: Test 44: ( 3 1 | 2 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 44 Test passed! 15: 15: Test 45: ( 3 1 2 | 4 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 45 Test passed! 15: 15: Test 46: ( 3 | 1 4 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 46 Test passed! 15: 15: Test 47: ( 3 1 | 4 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 47 Test passed! 15: 15: Test 48: ( 3 1 4 | 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 48 Test passed! 15: 15: Test 49: ( 3 | 4 1 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 49 Test passed! 15: 15: Test 50: ( 3 4 | 1 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 50 Test passed! 15: 15: Test 51: ( 3 4 1 | 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 51 Test passed! 15: 15: Test 52: ( 3 | 4 2 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 52 Test passed! 15: 15: Test 53: ( 3 4 | 2 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 53 Test passed! 15: 15: Test 54: ( 3 4 2 | 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 54 Test passed! 15: 15: Test 55: ( 4 | 2 3 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 55 Test passed! 15: 15: Test 56: ( 4 2 | 3 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 56 Test passed! 15: 15: Test 57: ( 4 2 3 | 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 57 Test passed! 15: 15: Test 58: ( 4 | 2 1 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 58 Test passed! 15: 15: Test 59: ( 4 2 | 1 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 59 Test passed! 15: 15: Test 60: ( 4 2 1 | 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 60 Test passed! 15: 15: Test 61: ( 4 | 3 2 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 61 Test passed! 15: 15: Test 62: ( 4 3 | 2 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 62 Test passed! 15: 15: Test 63: ( 4 3 2 | 1 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 63 Test passed! 15: 15: Test 64: ( 4 | 3 1 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 64 Test passed! 15: 15: Test 65: ( 4 3 | 1 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 65 Test passed! 15: 15: Test 66: ( 4 3 1 | 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 66 Test passed! 15: 15: Test 67: ( 4 | 1 3 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 67 Test passed! 15: 15: Test 68: ( 4 1 | 3 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 68 Test passed! 15: 15: Test 69: ( 4 1 3 | 2 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 69 Test passed! 15: 15: Test 70: ( 4 | 1 2 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 70 Test passed! 15: 15: Test 71: ( 4 1 | 2 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 71 Test passed! 15: 15: Test 72: ( 4 1 2 | 3 ) 15: Reference distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test distribution: -15: Dist vec 1: 0 1 -15: Dist vec 2: 0 1 0 0 1 0 1 0 1 1 0 0 1 -15: Dist vec 3: 0 1 0 1 1 0 1 +15: Dist vec 1: 3 5 +15: Dist vec 2: 0 0 0 0 0 0 0 0 0 0 0 0 0 +15: Dist vec 3: 0 0 0 0 0 0 0 15: Dist vec 4: 0 0 0 15: Test 72 Test passed! 15: @@ -54125,27 +54137,27 @@ 15: GLOBAL INFO OF (12|3) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (12|3) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: GLOBAL INFO OF (3|4) 15: block dimensions: 9 5 15: full dimensions: 74 32 -15: process grid dimensions: 4 3 +15: process grid dimensions: 7 1 15: 15: DISTRIBUTION OF (3|4) 15: Number of non-zero blocks: 12 15: Percentage of non-zero blocks: 26.67 -15: Average number of blocks per CPU: 1 -15: Maximum number of blocks per CPU: 3 -15: Average number of matrix elements per CPU: 65 -15: Maximum number of matrix elements per CPU: 299 +15: Average number of blocks per CPU: 2 +15: Maximum number of blocks per CPU: 4 +15: Average number of matrix elements per CPU: 111 +15: Maximum number of matrix elements per CPU: 483 15: INDEX INFO 15: tensor index: (bac) x (cd) = (bad) 15: matrix index: (ba|c) x (c|d) = (ba|d) @@ -54169,80 +54181,80 @@ 15: -------------------------------------------------------------------------------- 15: mm dims: 44 9 5 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 1338 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 2293 +15: Est. optimal split factor: 7 15: No redistribution of (12|3) matrix and (12|4) matrix -15: Change split factor of (12|3) matrix : Yes -15: Change split factor of (12|4) matrix : Yes +15: Change split factor of (12|3) matrix : No +15: Change split factor of (12|4) matrix : No 15: mm case: | x + = | 15: SPLIT / PARALLELIZATION INFO -15: splitting rows by factor 6 -15: global grid sizes: 6x 2 -15: grid sizes on subgroups: 1x 2 +15: splitting rows by factor 7 +15: global grid sizes: 7x 1 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (12|3) matrix 15: block dimensions: 44 9 15: full dimensions: 2075 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (3|4) matrix 15: block dimensions: 9 5 15: full dimensions: 74 32 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (12|4) matrix 15: block dimensions: 44 5 15: full dimensions: 2075 32 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: Change process grid: No 15: DISTRIBUTION OF (12|3) matrix 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 13 -15: Average number of matrix elements per group: 2719 -15: Maximum number of matrix elements per group: 5772 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per group: 5 +15: Maximum number of blocks per group: 11 +15: Average number of matrix elements per group: 2330 +15: Maximum number of matrix elements per group: 7584 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: DISTRIBUTION OF (3|4) matrix replicated -15: Number of non-zero blocks: 72 +15: Number of non-zero blocks: 84 15: Percentage of non-zero blocks: 26.67 15: Average number of blocks per group: 12 15: Maximum number of blocks per group: 12 15: Average number of matrix elements per group: 776 15: Maximum number of matrix elements per group: 776 -15: Average number of blocks per CPU: 6 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 388 -15: Maximum number of matrix elements per CPU: 450 +15: Average number of blocks per CPU: 12 +15: Maximum number of blocks per CPU: 12 +15: Average number of matrix elements per CPU: 776 +15: Maximum number of matrix elements per CPU: 776 15: DISTRIBUTION OF (12|4) matrix -15: Number of non-zero blocks: 38 -15: Percentage of non-zero blocks: 17.27 -15: Average number of blocks per group: 7 -15: Maximum number of blocks per group: 15 -15: Average number of matrix elements per group: 2675 -15: Maximum number of matrix elements per group: 6300 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1338 -15: Maximum number of matrix elements per CPU: 3924 +15: Number of non-zero blocks: 42 +15: Percentage of non-zero blocks: 19.09 +15: Average number of blocks per group: 6 +15: Maximum number of blocks per group: 14 +15: Average number of matrix elements per group: 2397 +15: Maximum number of matrix elements per group: 8478 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 14 +15: Average number of matrix elements per CPU: 2397 +15: Maximum number of matrix elements per CPU: 8478 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 1338 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 2293 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (12|4) 15: block dimensions: 4 11 5 15: full dimensions: 25 83 32 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (12|4) 15: Number of non-zero blocks: 42 15: Percentage of non-zero blocks: 19.09 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1398 -15: Maximum number of matrix elements per CPU: 3924 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 14 +15: Average number of matrix elements per CPU: 2397 +15: Maximum number of matrix elements per CPU: 8478 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -54257,27 +54269,27 @@ 15: GLOBAL INFO OF (2|31) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (2|31) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: GLOBAL INFO OF (4|3) 15: block dimensions: 9 5 15: full dimensions: 74 32 -15: process grid dimensions: 4 3 +15: process grid dimensions: 7 1 15: 15: DISTRIBUTION OF (4|3) 15: Number of non-zero blocks: 12 15: Percentage of non-zero blocks: 26.67 -15: Average number of blocks per CPU: 1 -15: Maximum number of blocks per CPU: 3 -15: Average number of matrix elements per CPU: 65 -15: Maximum number of matrix elements per CPU: 299 +15: Average number of blocks per CPU: 2 +15: Maximum number of blocks per CPU: 4 +15: Average number of matrix elements per CPU: 111 +15: Maximum number of matrix elements per CPU: 483 15: INDEX INFO 15: tensor index: (abc) x (cd) = (abd) 15: matrix index: (b|ca) x (d|c) = (bd|a) @@ -54301,106 +54313,106 @@ 15: GLOBAL INFO OF (2|31) 15: block dimensions: 11 9 4 15: full dimensions: 83 74 25 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (2|31) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 1360 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 7 +15: Average number of matrix elements per CPU: 2330 15: Maximum number of matrix elements per CPU: 4032 15: -------------------------------------------------------------------------------- 15: DBCSR TAS MATRIX MULTIPLICATION: (2|31) matrix x (4|3) matrix = (24|1) matrix 15: -------------------------------------------------------------------------------- 15: mm dims: 44 9 5 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 1338 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 2293 +15: Est. optimal split factor: 7 15: No redistribution of (2|31) matrix and (24|1) matrix -15: Change split factor of (2|31) matrix : Yes -15: Change split factor of (24|1) matrix : Yes +15: Change split factor of (2|31) matrix : No +15: Change split factor of (24|1) matrix : No 15: mm case: | x + = | 15: SPLIT / PARALLELIZATION INFO -15: splitting rows by factor 6 -15: global grid sizes: 6x 2 -15: grid sizes on subgroups: 1x 2 +15: splitting rows by factor 7 +15: global grid sizes: 7x 1 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (2|31) matrix 15: block dimensions: 44 9 15: full dimensions: 2075 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (4|3) matrix 15: block dimensions: 9 5 15: full dimensions: 74 32 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (24|1) matrix 15: block dimensions: 44 5 15: full dimensions: 2075 32 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: Change process grid: No 15: DISTRIBUTION OF (2|31) matrix 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 8 -15: Average number of matrix elements per group: 2719 -15: Maximum number of matrix elements per group: 6501 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 1360 +15: Average number of blocks per group: 5 +15: Maximum number of blocks per group: 7 +15: Average number of matrix elements per group: 2330 +15: Maximum number of matrix elements per group: 4032 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 7 +15: Average number of matrix elements per CPU: 2330 15: Maximum number of matrix elements per CPU: 4032 15: DISTRIBUTION OF (4|3) matrix replicated -15: Number of non-zero blocks: 72 +15: Number of non-zero blocks: 84 15: Percentage of non-zero blocks: 26.67 15: Average number of blocks per group: 12 15: Maximum number of blocks per group: 12 15: Average number of matrix elements per group: 776 15: Maximum number of matrix elements per group: 776 -15: Average number of blocks per CPU: 6 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 388 -15: Maximum number of matrix elements per CPU: 450 +15: Average number of blocks per CPU: 12 +15: Maximum number of blocks per CPU: 12 +15: Average number of matrix elements per CPU: 776 +15: Maximum number of matrix elements per CPU: 776 15: DISTRIBUTION OF (24|1) matrix 15: Number of non-zero blocks: 38 15: Percentage of non-zero blocks: 17.27 -15: Average number of blocks per group: 7 +15: Average number of blocks per group: 6 15: Maximum number of blocks per group: 11 -15: Average number of matrix elements per group: 2675 +15: Average number of matrix elements per group: 2293 15: Maximum number of matrix elements per group: 7680 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 1338 -15: Maximum number of matrix elements per CPU: 4992 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2293 +15: Maximum number of matrix elements per CPU: 7680 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 1338 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 2293 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (24|1) 15: block dimensions: 11 5 4 15: full dimensions: 83 32 25 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (24|1) 15: Number of non-zero blocks: 38 15: Percentage of non-zero blocks: 17.27 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 1338 -15: Maximum number of matrix elements per CPU: 4992 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2293 +15: Maximum number of matrix elements per CPU: 7680 15: GLOBAL INFO OF (24|1) 15: block dimensions: 4 11 5 15: full dimensions: 25 83 32 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (24|1) 15: Number of non-zero blocks: 42 15: Percentage of non-zero blocks: 19.09 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1398 -15: Maximum number of matrix elements per CPU: 3924 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 14 +15: Average number of matrix elements per CPU: 2397 +15: Maximum number of matrix elements per CPU: 8478 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -54415,27 +54427,27 @@ 15: GLOBAL INFO OF (4|3) 15: block dimensions: 9 5 15: full dimensions: 74 32 -15: process grid dimensions: 4 3 +15: process grid dimensions: 7 1 15: 15: DISTRIBUTION OF (4|3) 15: Number of non-zero blocks: 12 15: Percentage of non-zero blocks: 26.67 -15: Average number of blocks per CPU: 1 -15: Maximum number of blocks per CPU: 3 -15: Average number of matrix elements per CPU: 65 -15: Maximum number of matrix elements per CPU: 299 +15: Average number of blocks per CPU: 2 +15: Maximum number of blocks per CPU: 4 +15: Average number of matrix elements per CPU: 111 +15: Maximum number of matrix elements per CPU: 483 15: GLOBAL INFO OF (1|32) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (1|32) 15: Number of non-zero blocks: 30 15: Percentage of non-zero blocks: 7.58 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1355 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 10 +15: Average number of matrix elements per CPU: 2322 +15: Maximum number of matrix elements per CPU: 7584 15: INDEX INFO 15: tensor index: (ba) x (cdb) = (cda) 15: matrix index: (a|b) x (c|bd) = (da|c) @@ -54459,106 +54471,106 @@ 15: GLOBAL INFO OF (1|32) 15: block dimensions: 4 9 11 15: full dimensions: 25 74 83 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (1|32) 15: Number of non-zero blocks: 30 15: Percentage of non-zero blocks: 7.58 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1355 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 10 +15: Average number of matrix elements per CPU: 2322 +15: Maximum number of matrix elements per CPU: 7584 15: -------------------------------------------------------------------------------- 15: DBCSR TAS MATRIX MULTIPLICATION: (4|3) matrix x (1|32) matrix = (24|1) matrix 15: -------------------------------------------------------------------------------- 15: mm dims: 5 9 44 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 1338 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 2293 +15: Est. optimal split factor: 7 15: No redistribution of (1|32) matrix and (24|1) matrix -15: Change split factor of (1|32) matrix : Yes -15: Change split factor of (24|1) matrix : Yes +15: Change split factor of (1|32) matrix : No +15: Change split factor of (24|1) matrix : No 15: mm case: + x |T = |T 15: SPLIT / PARALLELIZATION INFO -15: splitting rows by factor 6 -15: global grid sizes: 6x 2 -15: grid sizes on subgroups: 1x 2 +15: splitting rows by factor 7 +15: global grid sizes: 7x 1 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (4|3) matrix 15: block dimensions: 5 9 15: full dimensions: 32 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (1|32) matrix 15: block dimensions: 44 9 15: full dimensions: 2075 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (24|1) matrix 15: block dimensions: 44 5 15: full dimensions: 2075 32 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: Change process grid: No 15: DISTRIBUTION OF (4|3) matrix replicated -15: Number of non-zero blocks: 72 +15: Number of non-zero blocks: 84 15: Percentage of non-zero blocks: 26.67 15: Average number of blocks per group: 12 15: Maximum number of blocks per group: 12 15: Average number of matrix elements per group: 776 15: Maximum number of matrix elements per group: 776 -15: Average number of blocks per CPU: 6 -15: Maximum number of blocks per CPU: 7 -15: Average number of matrix elements per CPU: 388 -15: Maximum number of matrix elements per CPU: 573 +15: Average number of blocks per CPU: 12 +15: Maximum number of blocks per CPU: 12 +15: Average number of matrix elements per CPU: 776 +15: Maximum number of matrix elements per CPU: 776 15: DISTRIBUTION OF (1|32) matrix 15: Number of non-zero blocks: 30 15: Percentage of non-zero blocks: 7.58 15: Average number of blocks per group: 5 -15: Maximum number of blocks per group: 12 -15: Average number of matrix elements per group: 2709 -15: Maximum number of matrix elements per group: 5772 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1355 -15: Maximum number of matrix elements per CPU: 4149 +15: Maximum number of blocks per group: 10 +15: Average number of matrix elements per group: 2322 +15: Maximum number of matrix elements per group: 7584 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 10 +15: Average number of matrix elements per CPU: 2322 +15: Maximum number of matrix elements per CPU: 7584 15: DISTRIBUTION OF (24|1) matrix 15: Number of non-zero blocks: 38 15: Percentage of non-zero blocks: 17.27 -15: Average number of blocks per group: 7 -15: Maximum number of blocks per group: 15 -15: Average number of matrix elements per group: 2675 -15: Maximum number of matrix elements per group: 6300 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1338 -15: Maximum number of matrix elements per CPU: 3924 +15: Average number of blocks per group: 6 +15: Maximum number of blocks per group: 13 +15: Average number of matrix elements per group: 2293 +15: Maximum number of matrix elements per group: 8244 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 13 +15: Average number of matrix elements per CPU: 2293 +15: Maximum number of matrix elements per CPU: 8244 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 1338 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 2293 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (24|1) 15: block dimensions: 11 5 4 15: full dimensions: 83 32 25 -15: process grid dimensions: 2 2 3 +15: process grid dimensions: 1 1 7 15: 15: DISTRIBUTION OF (24|1) 15: Number of non-zero blocks: 38 15: Percentage of non-zero blocks: 17.27 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1338 -15: Maximum number of matrix elements per CPU: 3924 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 13 +15: Average number of matrix elements per CPU: 2293 +15: Maximum number of matrix elements per CPU: 8244 15: GLOBAL INFO OF (24|1) 15: block dimensions: 4 11 5 15: full dimensions: 25 83 32 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (24|1) 15: Number of non-zero blocks: 42 15: Percentage of non-zero blocks: 19.09 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1398 -15: Maximum number of matrix elements per CPU: 3924 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 14 +15: Average number of matrix elements per CPU: 2397 +15: Maximum number of matrix elements per CPU: 8478 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -54573,27 +54585,27 @@ 15: GLOBAL INFO OF (1|24) 15: block dimensions: 4 11 5 15: full dimensions: 25 83 32 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (1|24) 15: Number of non-zero blocks: 3 15: Percentage of non-zero blocks: 1.36 15: Average number of blocks per CPU: 1 -15: Maximum number of blocks per CPU: 1 -15: Average number of matrix elements per CPU: 57 -15: Maximum number of matrix elements per CPU: 416 +15: Maximum number of blocks per CPU: 2 +15: Average number of matrix elements per CPU: 98 +15: Maximum number of matrix elements per CPU: 446 15: GLOBAL INFO OF (3|4) 15: block dimensions: 9 5 15: full dimensions: 74 32 -15: process grid dimensions: 4 3 +15: process grid dimensions: 7 1 15: 15: DISTRIBUTION OF (3|4) 15: Number of non-zero blocks: 12 15: Percentage of non-zero blocks: 26.67 -15: Average number of blocks per CPU: 1 -15: Maximum number of blocks per CPU: 3 -15: Average number of matrix elements per CPU: 65 -15: Maximum number of matrix elements per CPU: 299 +15: Average number of blocks per CPU: 2 +15: Maximum number of blocks per CPU: 4 +15: Average number of matrix elements per CPU: 111 +15: Maximum number of matrix elements per CPU: 483 15: INDEX INFO 15: tensor index: (abc) x (dc) = (abd) 15: matrix index: (a|bc) x (d|c) = (ba|d) @@ -54616,78 +54628,78 @@ 15: GLOBAL INFO OF (1|24) 15: block dimensions: 4 11 5 15: full dimensions: 25 83 32 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (1|24) 15: Number of non-zero blocks: 3 15: Percentage of non-zero blocks: 1.36 15: Average number of blocks per CPU: 1 -15: Maximum number of blocks per CPU: 1 -15: Average number of matrix elements per CPU: 57 -15: Maximum number of matrix elements per CPU: 416 +15: Maximum number of blocks per CPU: 2 +15: Average number of matrix elements per CPU: 98 +15: Maximum number of matrix elements per CPU: 446 15: -------------------------------------------------------------------------------- 15: DBCSR TAS MATRIX MULTIPLICATION: (1|24) matrix x (3|4) matrix = (21|3) matrix 15: -------------------------------------------------------------------------------- 15: mm dims: 44 5 9 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 113 +15: Est. number of matrix elements per CPU of result matrix: 193 15: Est. optimal split factor: 2 15: No redistribution of (1|24) matrix and (21|3) matrix -15: Change split factor of (1|24) matrix : No -15: Change split factor of (21|3) matrix : No +15: Change split factor of (1|24) matrix : Yes +15: Change split factor of (21|3) matrix : Yes 15: mm case: | x + = | 15: SPLIT / PARALLELIZATION INFO -15: splitting rows by factor 3 -15: global grid sizes: 6x 2 -15: grid sizes on subgroups: 2x 2 +15: splitting rows by factor 1 +15: global grid sizes: 7x 1 +15: grid sizes on subgroups: 7x 1 15: GLOBAL INFO OF (1|24) matrix 15: block dimensions: 44 5 15: full dimensions: 2075 32 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (3|4) matrix 15: block dimensions: 5 9 15: full dimensions: 32 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (21|3) matrix 15: block dimensions: 44 9 15: full dimensions: 2075 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: Change process grid: No 15: DISTRIBUTION OF (1|24) matrix 15: Number of non-zero blocks: 3 15: Percentage of non-zero blocks: 1.36 -15: Average number of blocks per group: 1 -15: Maximum number of blocks per group: 2 -15: Average number of matrix elements per group: 227 -15: Maximum number of matrix elements per group: 446 +15: Average number of blocks per group: 3 +15: Maximum number of blocks per group: 3 +15: Average number of matrix elements per group: 680 +15: Maximum number of matrix elements per group: 680 15: Average number of blocks per CPU: 1 -15: Maximum number of blocks per CPU: 1 -15: Average number of matrix elements per CPU: 57 -15: Maximum number of matrix elements per CPU: 416 +15: Maximum number of blocks per CPU: 2 +15: Average number of matrix elements per CPU: 98 +15: Maximum number of matrix elements per CPU: 446 15: DISTRIBUTION OF (3|4) matrix replicated -15: Number of non-zero blocks: 36 +15: Number of non-zero blocks: 12 15: Percentage of non-zero blocks: 26.67 15: Average number of blocks per group: 12 15: Maximum number of blocks per group: 12 15: Average number of matrix elements per group: 776 15: Maximum number of matrix elements per group: 776 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 194 -15: Maximum number of matrix elements per CPU: 347 +15: Average number of blocks per CPU: 2 +15: Maximum number of blocks per CPU: 4 +15: Average number of matrix elements per CPU: 111 +15: Maximum number of matrix elements per CPU: 338 15: DISTRIBUTION OF (21|3) matrix -15: Number of non-zero blocks: 38 -15: Percentage of non-zero blocks: 9.60 -15: Average number of blocks per group: 13 -15: Maximum number of blocks per group: 19 -15: Average number of matrix elements per group: 5887 -15: Maximum number of matrix elements per group: 9921 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1472 -15: Maximum number of matrix elements per CPU: 4149 +15: Number of non-zero blocks: 6 +15: Percentage of non-zero blocks: 1.52 +15: Average number of blocks per group: 6 +15: Maximum number of blocks per group: 6 +15: Average number of matrix elements per group: 1350 +15: Maximum number of matrix elements per group: 1350 +15: Average number of blocks per CPU: 1 +15: Maximum number of blocks per CPU: 4 +15: Average number of matrix elements per CPU: 193 +15: Maximum number of matrix elements per CPU: 882 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 113 +15: Number of matrix elements per CPU of result matrix: 193 15: Optimal split factor: 2 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE @@ -54695,15 +54707,15 @@ 15: GLOBAL INFO OF (21|3) 15: block dimensions: 11 4 9 15: full dimensions: 83 25 74 -15: process grid dimensions: 2 3 2 +15: process grid dimensions: 1 7 1 15: 15: DISTRIBUTION OF (21|3) 15: Number of non-zero blocks: 38 15: Percentage of non-zero blocks: 9.60 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1472 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2523 +15: Maximum number of matrix elements per CPU: 7584 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -54718,27 +54730,27 @@ 15: GLOBAL INFO OF (12|3) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (12|3) 15: Number of non-zero blocks: 13 15: Percentage of non-zero blocks: 3.28 15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 3 -15: Average number of matrix elements per CPU: 738 -15: Maximum number of matrix elements per CPU: 4149 +15: Maximum number of blocks per CPU: 5 +15: Average number of matrix elements per CPU: 1265 +15: Maximum number of matrix elements per CPU: 4464 15: GLOBAL INFO OF (12|45) 15: block dimensions: 4 11 5 3 15: full dimensions: 25 83 32 28 -15: process grid dimensions: 3 2 2 1 +15: process grid dimensions: 7 1 1 1 15: 15: DISTRIBUTION OF (12|45) 15: Number of non-zero blocks: 21 15: Percentage of non-zero blocks: 3.18 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 4 -15: Average number of matrix elements per CPU: 11467 -15: Maximum number of matrix elements per CPU: 96768 +15: Average number of blocks per CPU: 3 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 19657 +15: Maximum number of matrix elements per CPU: 126828 15: INDEX INFO 15: tensor index: (cba) x (cbde) = (ade) 15: matrix index: (cb|a) x (cb|de) = (a|de) @@ -54762,80 +54774,80 @@ 15: -------------------------------------------------------------------------------- 15: mm dims: 9 44 15 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 703 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 1204 +15: Est. optimal split factor: 7 15: No redistribution of (12|3) matrix and (12|45) matrix -15: Change split factor of (12|3) matrix : Yes -15: Change split factor of (12|45) matrix : Yes +15: Change split factor of (12|3) matrix : No +15: Change split factor of (12|45) matrix : No 15: mm case: |T x | = + 15: SPLIT / PARALLELIZATION INFO -15: splitting rows by factor 6 -15: global grid sizes: 6x 2 -15: grid sizes on subgroups: 1x 2 +15: splitting rows by factor 7 +15: global grid sizes: 7x 1 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (12|3) matrix 15: block dimensions: 44 9 15: full dimensions: 2075 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (12|45) matrix 15: block dimensions: 44 15 15: full dimensions: 2075 896 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (3|45) matrix 15: block dimensions: 9 15 15: full dimensions: 74 896 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: Change process grid: No 15: DISTRIBUTION OF (12|3) matrix 15: Number of non-zero blocks: 13 15: Percentage of non-zero blocks: 3.28 -15: Average number of blocks per group: 3 -15: Maximum number of blocks per group: 4 -15: Average number of matrix elements per group: 1476 -15: Maximum number of matrix elements per group: 4149 +15: Average number of blocks per group: 2 +15: Maximum number of blocks per group: 5 +15: Average number of matrix elements per group: 1265 +15: Maximum number of matrix elements per group: 4464 15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 3 -15: Average number of matrix elements per CPU: 738 -15: Maximum number of matrix elements per CPU: 4149 +15: Maximum number of blocks per CPU: 5 +15: Average number of matrix elements per CPU: 1265 +15: Maximum number of matrix elements per CPU: 4464 15: DISTRIBUTION OF (12|45) matrix 15: Number of non-zero blocks: 21 15: Percentage of non-zero blocks: 3.18 -15: Average number of blocks per group: 4 -15: Maximum number of blocks per group: 6 -15: Average number of matrix elements per group: 22933 -15: Maximum number of matrix elements per group: 105984 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 4 -15: Average number of matrix elements per CPU: 11467 -15: Maximum number of matrix elements per CPU: 96768 +15: Average number of blocks per group: 3 +15: Maximum number of blocks per group: 11 +15: Average number of matrix elements per group: 19657 +15: Maximum number of matrix elements per group: 126828 +15: Average number of blocks per CPU: 3 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 19657 +15: Maximum number of matrix elements per CPU: 126828 15: DISTRIBUTION OF (3|45) matrix replicated 15: Number of non-zero blocks: 14 -15: Percentage of non-zero blocks: 1.73 -15: Average number of blocks per group: 3 -15: Maximum number of blocks per group: 7 -15: Average number of matrix elements per group: 1405 -15: Maximum number of matrix elements per group: 7014 +15: Percentage of non-zero blocks: 1.48 +15: Average number of blocks per group: 2 +15: Maximum number of blocks per group: 8 +15: Average number of matrix elements per group: 1204 +15: Maximum number of matrix elements per group: 7174 15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 703 -15: Maximum number of matrix elements per CPU: 6598 +15: Maximum number of blocks per CPU: 8 +15: Average number of matrix elements per CPU: 1204 +15: Maximum number of matrix elements per CPU: 7174 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 585 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 1025 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (3|45) 15: block dimensions: 9 5 3 15: full dimensions: 74 32 28 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (3|45) 15: Number of non-zero blocks: 22 15: Percentage of non-zero blocks: 16.30 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 896 -15: Maximum number of matrix elements per CPU: 3982 +15: Average number of blocks per CPU: 4 +15: Maximum number of blocks per CPU: 7 +15: Average number of matrix elements per CPU: 1536 +15: Maximum number of matrix elements per CPU: 4104 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -54850,27 +54862,27 @@ 15: GLOBAL INFO OF (3|21) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (3|21) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: GLOBAL INFO OF (12|45) 15: block dimensions: 4 11 5 3 15: full dimensions: 25 83 32 28 -15: process grid dimensions: 3 2 2 1 +15: process grid dimensions: 7 1 1 1 15: 15: DISTRIBUTION OF (12|45) 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 96912 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 15 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 130644 15: INDEX INFO 15: tensor index: (cba) x (cbde) = (ade) 15: matrix index: (a|bc) x (cb|de) = (a|de) @@ -54893,94 +54905,94 @@ 15: GLOBAL INFO OF (3|21) 15: block dimensions: 9 11 4 15: full dimensions: 74 83 25 -15: process grid dimensions: 2 2 3 +15: process grid dimensions: 1 1 7 15: 15: DISTRIBUTION OF (3|21) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: -------------------------------------------------------------------------------- 15: DBCSR TAS MATRIX MULTIPLICATION: (3|21) matrix x (12|45) matrix = (3|45) matrix 15: -------------------------------------------------------------------------------- 15: mm dims: 9 44 15 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 879 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 1506 +15: Est. optimal split factor: 7 15: No redistribution of (3|21) matrix and (12|45) matrix -15: Change split factor of (3|21) matrix : Yes -15: Change split factor of (12|45) matrix : Yes +15: Change split factor of (3|21) matrix : No +15: Change split factor of (12|45) matrix : No 15: mm case: |T x | = + 15: SPLIT / PARALLELIZATION INFO -15: splitting rows by factor 6 -15: global grid sizes: 6x 2 -15: grid sizes on subgroups: 1x 2 +15: splitting rows by factor 7 +15: global grid sizes: 7x 1 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (3|21) matrix 15: block dimensions: 44 9 15: full dimensions: 2075 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (12|45) matrix 15: block dimensions: 44 15 15: full dimensions: 2075 896 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (3|45) matrix 15: block dimensions: 9 15 15: full dimensions: 74 896 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: Change process grid: No 15: DISTRIBUTION OF (3|21) matrix 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 13 -15: Average number of matrix elements per group: 2719 -15: Maximum number of matrix elements per group: 5772 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per group: 5 +15: Maximum number of blocks per group: 11 +15: Average number of matrix elements per group: 2330 +15: Maximum number of matrix elements per group: 7584 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: DISTRIBUTION OF (12|45) matrix 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 9 -15: Average number of matrix elements per group: 24915 -15: Maximum number of matrix elements per group: 108504 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 96912 +15: Maximum number of blocks per group: 15 +15: Average number of matrix elements per group: 21356 +15: Maximum number of matrix elements per group: 130644 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 15 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 130644 15: DISTRIBUTION OF (3|45) matrix replicated 15: Number of non-zero blocks: 23 -15: Percentage of non-zero blocks: 2.84 +15: Percentage of non-zero blocks: 2.43 15: Average number of blocks per group: 4 -15: Maximum number of blocks per group: 8 -15: Average number of matrix elements per group: 1784 -15: Maximum number of matrix elements per group: 7014 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 892 -15: Maximum number of matrix elements per CPU: 6598 +15: Maximum number of blocks per group: 9 +15: Average number of matrix elements per group: 1529 +15: Maximum number of matrix elements per group: 7266 +15: Average number of blocks per CPU: 4 +15: Maximum number of blocks per CPU: 9 +15: Average number of matrix elements per CPU: 1529 +15: Maximum number of matrix elements per CPU: 7266 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 585 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 1038 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (3|45) 15: block dimensions: 9 5 3 15: full dimensions: 74 32 28 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (3|45) 15: Number of non-zero blocks: 29 15: Percentage of non-zero blocks: 21.48 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 1072 -15: Maximum number of matrix elements per CPU: 3982 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 8 +15: Average number of matrix elements per CPU: 1838 +15: Maximum number of matrix elements per CPU: 4760 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -54995,27 +55007,27 @@ 15: GLOBAL INFO OF (13|2) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (13|2) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: GLOBAL INFO OF (54|21) 15: block dimensions: 4 11 5 3 15: full dimensions: 25 83 32 28 -15: process grid dimensions: 3 2 2 1 +15: process grid dimensions: 7 1 1 1 15: 15: DISTRIBUTION OF (54|21) 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 96912 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 15 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 130644 15: INDEX INFO 15: tensor index: (bca) x (bcde) = (ade) 15: matrix index: (ba|c) x (ed|cb) = (a|de) @@ -55039,106 +55051,106 @@ 15: GLOBAL INFO OF (13|2) 15: block dimensions: 4 9 11 15: full dimensions: 25 74 83 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (13|2) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: -------------------------------------------------------------------------------- 15: DBCSR TAS MATRIX MULTIPLICATION: (13|2) matrix x (54|21) matrix = (3|45) matrix 15: -------------------------------------------------------------------------------- 15: mm dims: 9 44 15 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 879 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 1506 +15: Est. optimal split factor: 7 15: No redistribution of (13|2) matrix and (54|21) matrix -15: Change split factor of (13|2) matrix : Yes -15: Change split factor of (54|21) matrix : Yes +15: Change split factor of (13|2) matrix : No +15: Change split factor of (54|21) matrix : No 15: mm case: -- x --T = + 15: SPLIT / PARALLELIZATION INFO -15: splitting columns by factor 6 -15: global grid sizes: 2x 6 -15: grid sizes on subgroups: 2x 1 +15: splitting columns by factor 7 +15: global grid sizes: 1x 7 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (13|2) matrix 15: block dimensions: 9 44 15: full dimensions: 74 2075 -15: process grid dimensions: 2 6 +15: process grid dimensions: 1 7 15: GLOBAL INFO OF (54|21) matrix 15: block dimensions: 15 44 15: full dimensions: 896 2075 -15: process grid dimensions: 2 6 +15: process grid dimensions: 1 7 15: GLOBAL INFO OF (3|45) matrix 15: block dimensions: 9 15 15: full dimensions: 74 896 -15: process grid dimensions: 2 6 +15: process grid dimensions: 1 7 15: Change process grid: No 15: DISTRIBUTION OF (13|2) matrix 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 13 -15: Average number of matrix elements per group: 2719 -15: Maximum number of matrix elements per group: 5772 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per group: 5 +15: Maximum number of blocks per group: 11 +15: Average number of matrix elements per group: 2330 +15: Maximum number of matrix elements per group: 7584 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: DISTRIBUTION OF (54|21) matrix 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 9 -15: Average number of matrix elements per group: 24915 -15: Maximum number of matrix elements per group: 108504 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 96912 +15: Maximum number of blocks per group: 15 +15: Average number of matrix elements per group: 21356 +15: Maximum number of matrix elements per group: 130644 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 15 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 130644 15: DISTRIBUTION OF (3|45) matrix replicated 15: Number of non-zero blocks: 23 -15: Percentage of non-zero blocks: 2.84 +15: Percentage of non-zero blocks: 2.43 15: Average number of blocks per group: 4 -15: Maximum number of blocks per group: 8 -15: Average number of matrix elements per group: 1784 -15: Maximum number of matrix elements per group: 7014 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 7 -15: Average number of matrix elements per CPU: 892 -15: Maximum number of matrix elements per CPU: 7014 +15: Maximum number of blocks per group: 9 +15: Average number of matrix elements per group: 1529 +15: Maximum number of matrix elements per group: 7266 +15: Average number of blocks per CPU: 4 +15: Maximum number of blocks per CPU: 9 +15: Average number of matrix elements per CPU: 1529 +15: Maximum number of matrix elements per CPU: 7266 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 585 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 1038 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (3|45) 15: block dimensions: 9 5 3 15: full dimensions: 74 32 28 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (3|45) 15: Number of non-zero blocks: 21 15: Percentage of non-zero blocks: 15.56 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 4 -15: Average number of matrix elements per CPU: 879 -15: Maximum number of matrix elements per CPU: 3718 +15: Average number of blocks per CPU: 3 +15: Maximum number of blocks per CPU: 5 +15: Average number of matrix elements per CPU: 1506 +15: Maximum number of matrix elements per CPU: 4760 15: GLOBAL INFO OF (3|45) 15: block dimensions: 9 5 3 15: full dimensions: 74 32 28 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (3|45) 15: Number of non-zero blocks: 29 15: Percentage of non-zero blocks: 21.48 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 1072 -15: Maximum number of matrix elements per CPU: 3982 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 8 +15: Average number of matrix elements per CPU: 1838 +15: Maximum number of matrix elements per CPU: 4760 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -55153,27 +55165,27 @@ 15: GLOBAL INFO OF (54|21) 15: block dimensions: 4 11 5 3 15: full dimensions: 25 83 32 28 -15: process grid dimensions: 3 2 2 1 +15: process grid dimensions: 7 1 1 1 15: 15: DISTRIBUTION OF (54|21) 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 96912 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 15 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 130644 15: GLOBAL INFO OF (2|31) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (2|31) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: INDEX INFO 15: tensor index: (dcba) x (dce) = (eba) 15: matrix index: (ab|cd) x (c|ed) = (be|a) @@ -55197,106 +55209,106 @@ 15: GLOBAL INFO OF (2|31) 15: block dimensions: 11 9 4 15: full dimensions: 83 74 25 -15: process grid dimensions: 2 2 3 +15: process grid dimensions: 1 1 7 15: 15: DISTRIBUTION OF (2|31) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: -------------------------------------------------------------------------------- 15: DBCSR TAS MATRIX MULTIPLICATION: (54|21) matrix x (2|31) matrix = (43|5) matrix 15: -------------------------------------------------------------------------------- 15: mm dims: 15 44 9 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 879 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 1506 +15: Est. optimal split factor: 7 15: No redistribution of (54|21) matrix and (2|31) matrix -15: Change split factor of (54|21) matrix : Yes -15: Change split factor of (2|31) matrix : Yes +15: Change split factor of (54|21) matrix : No +15: Change split factor of (2|31) matrix : No 15: mm case: -- x --T = + 15: SPLIT / PARALLELIZATION INFO -15: splitting columns by factor 6 -15: global grid sizes: 2x 6 -15: grid sizes on subgroups: 2x 1 +15: splitting columns by factor 7 +15: global grid sizes: 1x 7 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (54|21) matrix 15: block dimensions: 15 44 15: full dimensions: 896 2075 -15: process grid dimensions: 2 6 +15: process grid dimensions: 1 7 15: GLOBAL INFO OF (2|31) matrix 15: block dimensions: 9 44 15: full dimensions: 74 2075 -15: process grid dimensions: 2 6 +15: process grid dimensions: 1 7 15: GLOBAL INFO OF (43|5) matrix 15: block dimensions: 15 9 15: full dimensions: 896 74 -15: process grid dimensions: 2 6 +15: process grid dimensions: 1 7 15: Change process grid: No 15: DISTRIBUTION OF (54|21) matrix 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 9 -15: Average number of matrix elements per group: 24915 -15: Maximum number of matrix elements per group: 108504 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 96912 +15: Maximum number of blocks per group: 15 +15: Average number of matrix elements per group: 21356 +15: Maximum number of matrix elements per group: 130644 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 15 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 130644 15: DISTRIBUTION OF (2|31) matrix 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 13 -15: Average number of matrix elements per group: 2719 -15: Maximum number of matrix elements per group: 5772 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per group: 5 +15: Maximum number of blocks per group: 11 +15: Average number of matrix elements per group: 2330 +15: Maximum number of matrix elements per group: 7584 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: DISTRIBUTION OF (43|5) matrix replicated 15: Number of non-zero blocks: 23 -15: Percentage of non-zero blocks: 2.84 +15: Percentage of non-zero blocks: 2.43 15: Average number of blocks per group: 4 -15: Maximum number of blocks per group: 8 -15: Average number of matrix elements per group: 1784 -15: Maximum number of matrix elements per group: 7014 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 892 -15: Maximum number of matrix elements per CPU: 6598 +15: Maximum number of blocks per group: 9 +15: Average number of matrix elements per group: 1529 +15: Maximum number of matrix elements per group: 7266 +15: Average number of blocks per CPU: 4 +15: Maximum number of blocks per CPU: 9 +15: Average number of matrix elements per CPU: 1529 +15: Maximum number of matrix elements per CPU: 7266 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 585 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 1038 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (43|5) 15: block dimensions: 5 9 3 15: full dimensions: 32 74 28 -15: process grid dimensions: 2 2 3 +15: process grid dimensions: 1 1 7 15: 15: DISTRIBUTION OF (43|5) 15: Number of non-zero blocks: 21 15: Percentage of non-zero blocks: 15.56 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 879 -15: Maximum number of matrix elements per CPU: 6292 +15: Average number of blocks per CPU: 3 +15: Maximum number of blocks per CPU: 8 +15: Average number of matrix elements per CPU: 1506 +15: Maximum number of matrix elements per CPU: 8118 15: GLOBAL INFO OF (43|5) 15: block dimensions: 9 5 3 15: full dimensions: 74 32 28 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (43|5) 15: Number of non-zero blocks: 29 15: Percentage of non-zero blocks: 21.48 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 1072 -15: Maximum number of matrix elements per CPU: 3982 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 8 +15: Average number of matrix elements per CPU: 1838 +15: Maximum number of matrix elements per CPU: 4760 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -55311,27 +55323,27 @@ 15: GLOBAL INFO OF (241|5) 15: block dimensions: 4 11 5 3 15: full dimensions: 25 83 32 28 -15: process grid dimensions: 3 2 2 1 +15: process grid dimensions: 7 1 1 1 15: 15: DISTRIBUTION OF (241|5) 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 96912 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 15 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 130644 15: GLOBAL INFO OF (31|2) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (31|2) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: INDEX INFO 15: tensor index: (dcab) x (dce) = (eab) 15: matrix index: (cad|b) x (ed|c) = (b|ae) @@ -55356,118 +55368,118 @@ 15: GLOBAL INFO OF (241|5) 15: block dimensions: 11 5 4 3 15: full dimensions: 83 32 25 28 -15: process grid dimensions: 3 2 2 1 +15: process grid dimensions: 7 1 1 1 15: 15: DISTRIBUTION OF (241|5) 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 82368 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 14 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 91584 15: GLOBAL INFO OF (31|2) 15: block dimensions: 9 4 11 15: full dimensions: 74 25 83 -15: process grid dimensions: 2 2 3 +15: process grid dimensions: 1 1 7 15: 15: DISTRIBUTION OF (31|2) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 1360 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 7 +15: Average number of matrix elements per CPU: 2330 15: Maximum number of matrix elements per CPU: 4032 15: -------------------------------------------------------------------------------- 15: DBCSR TAS MATRIX MULTIPLICATION: (241|5) matrix x (31|2) matrix = (5|43) matrix 15: -------------------------------------------------------------------------------- 15: mm dims: 15 44 9 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 879 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 1506 +15: Est. optimal split factor: 7 15: No redistribution of (241|5) matrix and (31|2) matrix -15: Change split factor of (241|5) matrix : Yes -15: Change split factor of (31|2) matrix : Yes +15: Change split factor of (241|5) matrix : No +15: Change split factor of (31|2) matrix : No 15: mm case: |T x | = + 15: SPLIT / PARALLELIZATION INFO -15: splitting rows by factor 6 -15: global grid sizes: 6x 2 -15: grid sizes on subgroups: 1x 2 +15: splitting rows by factor 7 +15: global grid sizes: 7x 1 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (241|5) matrix 15: block dimensions: 44 15 15: full dimensions: 2075 896 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (31|2) matrix 15: block dimensions: 44 9 15: full dimensions: 2075 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (5|43) matrix 15: block dimensions: 15 9 15: full dimensions: 896 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: Change process grid: No 15: DISTRIBUTION OF (241|5) matrix 15: Number of non-zero blocks: 36 15: Percentage of non-zero blocks: 5.45 15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 10 -15: Average number of matrix elements per group: 24915 +15: Maximum number of blocks per group: 14 +15: Average number of matrix elements per group: 21356 15: Maximum number of matrix elements per group: 91584 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 12458 -15: Maximum number of matrix elements per CPU: 82368 +15: Average number of blocks per CPU: 6 +15: Maximum number of blocks per CPU: 14 +15: Average number of matrix elements per CPU: 21356 +15: Maximum number of matrix elements per CPU: 91584 15: DISTRIBUTION OF (31|2) matrix 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 8 -15: Average number of matrix elements per group: 2719 -15: Maximum number of matrix elements per group: 6501 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 1360 +15: Average number of blocks per group: 5 +15: Maximum number of blocks per group: 7 +15: Average number of matrix elements per group: 2330 +15: Maximum number of matrix elements per group: 4032 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 7 +15: Average number of matrix elements per CPU: 2330 15: Maximum number of matrix elements per CPU: 4032 15: DISTRIBUTION OF (5|43) matrix replicated 15: Number of non-zero blocks: 23 -15: Percentage of non-zero blocks: 2.84 +15: Percentage of non-zero blocks: 2.43 15: Average number of blocks per group: 4 15: Maximum number of blocks per group: 9 -15: Average number of matrix elements per group: 1784 +15: Average number of matrix elements per group: 1529 15: Maximum number of matrix elements per group: 4134 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 892 +15: Average number of blocks per CPU: 4 +15: Maximum number of blocks per CPU: 9 +15: Average number of matrix elements per CPU: 1529 15: Maximum number of matrix elements per CPU: 4134 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 345 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 591 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (5|43) 15: block dimensions: 3 5 9 15: full dimensions: 28 32 74 -15: process grid dimensions: 1 2 6 +15: process grid dimensions: 1 1 7 15: 15: DISTRIBUTION OF (5|43) 15: Number of non-zero blocks: 21 15: Percentage of non-zero blocks: 15.56 -15: Average number of blocks per CPU: 2 -15: Maximum number of blocks per CPU: 3 -15: Average number of matrix elements per CPU: 879 -15: Maximum number of matrix elements per CPU: 3120 +15: Average number of blocks per CPU: 3 +15: Maximum number of blocks per CPU: 5 +15: Average number of matrix elements per CPU: 1506 +15: Maximum number of matrix elements per CPU: 4760 15: GLOBAL INFO OF (5|43) 15: block dimensions: 9 5 3 15: full dimensions: 74 32 28 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (5|43) 15: Number of non-zero blocks: 29 15: Percentage of non-zero blocks: 21.48 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 5 -15: Average number of matrix elements per CPU: 1072 -15: Maximum number of matrix elements per CPU: 3982 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 8 +15: Average number of matrix elements per CPU: 1838 +15: Maximum number of matrix elements per CPU: 4760 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -55482,27 +55494,27 @@ 15: GLOBAL INFO OF (34|5) 15: block dimensions: 9 5 3 15: full dimensions: 74 32 28 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (34|5) 15: Number of non-zero blocks: 8 15: Percentage of non-zero blocks: 5.93 -15: Average number of blocks per CPU: 1 -15: Maximum number of blocks per CPU: 2 -15: Average number of matrix elements per CPU: 194 -15: Maximum number of matrix elements per CPU: 792 +15: Average number of blocks per CPU: 2 +15: Maximum number of blocks per CPU: 3 +15: Average number of matrix elements per CPU: 332 +15: Maximum number of matrix elements per CPU: 1224 15: GLOBAL INFO OF (12|3) 15: block dimensions: 4 11 9 15: full dimensions: 25 83 74 -15: process grid dimensions: 3 2 2 +15: process grid dimensions: 7 1 1 15: 15: DISTRIBUTION OF (12|3) 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: INDEX INFO 15: tensor index: (cab) x (dec) = (deab) 15: matrix index: (ca|b) x (de|c) = (da|eb) @@ -55526,106 +55538,106 @@ 15: GLOBAL INFO OF (34|5) 15: block dimensions: 9 5 3 15: full dimensions: 74 32 28 -15: process grid dimensions: 2 3 2 +15: process grid dimensions: 1 7 1 15: 15: DISTRIBUTION OF (34|5) 15: Number of non-zero blocks: 8 15: Percentage of non-zero blocks: 5.93 -15: Average number of blocks per CPU: 1 +15: Average number of blocks per CPU: 2 15: Maximum number of blocks per CPU: 2 -15: Average number of matrix elements per CPU: 194 +15: Average number of matrix elements per CPU: 332 15: Maximum number of matrix elements per CPU: 1056 15: -------------------------------------------------------------------------------- 15: DBCSR TAS MATRIX MULTIPLICATION: (34|5) matrix x (12|3) matrix = (14|25) matrix 15: -------------------------------------------------------------------------------- 15: mm dims: 15 9 44 15: MM PARAMETERS -15: Est. number of matrix elements per CPU of result matrix: 5390 -15: Est. optimal split factor: 12 +15: Est. number of matrix elements per CPU of result matrix: 9240 +15: Est. optimal split factor: 7 15: No redistribution of (12|3) matrix and (14|25) matrix -15: Change split factor of (12|3) matrix : Yes -15: Change split factor of (14|25) matrix : Yes +15: Change split factor of (12|3) matrix : No +15: Change split factor of (14|25) matrix : No 15: mm case: + x |T = |T 15: SPLIT / PARALLELIZATION INFO -15: splitting rows by factor 6 -15: global grid sizes: 6x 2 -15: grid sizes on subgroups: 1x 2 +15: splitting rows by factor 7 +15: global grid sizes: 7x 1 +15: grid sizes on subgroups: 1x 1 15: GLOBAL INFO OF (34|5) matrix 15: block dimensions: 15 9 15: full dimensions: 896 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (12|3) matrix 15: block dimensions: 44 9 15: full dimensions: 2075 74 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: GLOBAL INFO OF (14|25) matrix 15: block dimensions: 44 15 15: full dimensions: 2075 896 -15: process grid dimensions: 6 2 +15: process grid dimensions: 7 1 15: Change process grid: No 15: DISTRIBUTION OF (34|5) matrix replicated -15: Number of non-zero blocks: 48 +15: Number of non-zero blocks: 56 15: Percentage of non-zero blocks: 5.93 15: Average number of blocks per group: 8 15: Maximum number of blocks per group: 8 15: Average number of matrix elements per group: 2324 15: Maximum number of matrix elements per group: 2324 -15: Average number of blocks per CPU: 4 -15: Maximum number of blocks per CPU: 4 -15: Average number of matrix elements per CPU: 1162 -15: Maximum number of matrix elements per CPU: 1488 +15: Average number of blocks per CPU: 8 +15: Maximum number of blocks per CPU: 8 +15: Average number of matrix elements per CPU: 2324 +15: Maximum number of matrix elements per CPU: 2324 15: DISTRIBUTION OF (12|3) matrix 15: Number of non-zero blocks: 32 15: Percentage of non-zero blocks: 8.08 -15: Average number of blocks per group: 6 -15: Maximum number of blocks per group: 13 -15: Average number of matrix elements per group: 2719 -15: Maximum number of matrix elements per group: 5772 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 8 -15: Average number of matrix elements per CPU: 1360 -15: Maximum number of matrix elements per CPU: 4149 +15: Average number of blocks per group: 5 +15: Maximum number of blocks per group: 11 +15: Average number of matrix elements per group: 2330 +15: Maximum number of matrix elements per group: 7584 +15: Average number of blocks per CPU: 5 +15: Maximum number of blocks per CPU: 11 +15: Average number of matrix elements per CPU: 2330 +15: Maximum number of matrix elements per CPU: 7584 15: DISTRIBUTION OF (14|25) matrix 15: Number of non-zero blocks: 26 15: Percentage of non-zero blocks: 3.94 -15: Average number of blocks per group: 5 -15: Maximum number of blocks per group: 11 -15: Average number of matrix elements per group: 10780 -15: Maximum number of matrix elements per group: 31464 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 5390 -15: Maximum number of matrix elements per CPU: 29304 +15: Average number of blocks per group: 4 +15: Maximum number of blocks per group: 9 +15: Average number of matrix elements per group: 9240 +15: Maximum number of matrix elements per group: 33750 +15: Average number of blocks per CPU: 4 +15: Maximum number of blocks per CPU: 9 +15: Average number of matrix elements per CPU: 9240 +15: Maximum number of matrix elements per CPU: 33750 15: MM PARAMETERS -15: Number of matrix elements per CPU of result matrix: 5390 -15: Optimal split factor: 12 +15: Number of matrix elements per CPU of result matrix: 9240 +15: Optimal split factor: 7 15: -------------------------------------------------------------------------------- 15: TAS MATRIX MULTIPLICATION DONE 15: -------------------------------------------------------------------------------- 15: GLOBAL INFO OF (14|25) 15: block dimensions: 4 5 11 3 15: full dimensions: 25 32 83 28 -15: process grid dimensions: 3 2 2 1 +15: process grid dimensions: 7 1 1 1 15: 15: DISTRIBUTION OF (14|25) 15: Number of non-zero blocks: 26 15: Percentage of non-zero blocks: 3.94 -15: Average number of blocks per CPU: 3 -15: Maximum number of blocks per CPU: 6 -15: Average number of matrix elements per CPU: 5390 -15: Maximum number of matrix elements per CPU: 29304 +15: Average number of blocks per CPU: 4 +15: Maximum number of blocks per CPU: 9 +15: Average number of matrix elements per CPU: 9240 +15: Maximum number of matrix elements per CPU: 33750 15: GLOBAL INFO OF (14|25) 15: block dimensions: 4 11 5 3 15: full dimensions: 25 83 32 28 -15: process grid dimensions: 3 2 2 1 +15: process grid dimensions: 7 1 1 1 15: 15: DISTRIBUTION OF (14|25) 15: Number of non-zero blocks: 62 15: Percentage of non-zero blocks: 9.39 -15: Average number of blocks per CPU: 6 -15: Maximum number of blocks per CPU: 12 -15: Average number of matrix elements per CPU: 17848 -15: Maximum number of matrix elements per CPU: 126216 +15: Average number of blocks per CPU: 9 +15: Maximum number of blocks per CPU: 23 +15: Average number of matrix elements per CPU: 30596 +15: Maximum number of matrix elements per CPU: 164394 15: -------------------------------------------------------------------------------- 15: TENSOR CONTRACTION DONE 15: -------------------------------------------------------------------------------- @@ -55637,68 +55649,59 @@ 15: - - 15: ------------------------------------------------------------------------------- 15: COUNTER TOTAL BLAS SMM ACC -15: flops 5 x 3 x 6 180 100.0% 0.0% 0.0% -15: flops 5 x 7 x 6 420 100.0% 0.0% 0.0% +15: flops 9 x 1 x 3 54 100.0% 0.0% 0.0% +15: flops 9 x 1 x 7 126 100.0% 0.0% 0.0% +15: flops 9 x 6 x 3 324 100.0% 0.0% 0.0% +15: flops 9 x 4 x 7 504 100.0% 0.0% 0.0% +15: flops 36 x 1 x 7 504 100.0% 0.0% 0.0% 15: flops 1 x 1 x 1 522 100.0% 0.0% 0.0% 15: flops 96 x 1 x 3 576 100.0% 0.0% 0.0% 15: flops 24 x 2 x 7 672 100.0% 0.0% 0.0% -15: flops 16 x 5 x 6 960 100.0% 0.0% 0.0% -15: flops 36 x 1 x 7 1008 100.0% 0.0% 0.0% -15: flops 36 x 2 x 7 1008 100.0% 0.0% 0.0% 15: flops 288 x 1 x 3 1728 100.0% 0.0% 0.0% -15: flops 8 x 7 x 24 2688 100.0% 0.0% 0.0% 15: flops 24 x 4 x 7 2688 100.0% 0.0% 0.0% +15: flops 36 x 6 x 7 3024 100.0% 0.0% 0.0% 15: flops 96 x 6 x 3 3456 100.0% 0.0% 0.0% 15: flops 24 x 6 x 7 4032 100.0% 0.0% 0.0% -15: flops 7 x 8 x 24 5376 100.0% 0.0% 0.0% -15: flops 36 x 6 x 7 6048 100.0% 0.0% 0.0% -15: flops 96 x 13 x 3 7488 100.0% 0.0% 0.0% -15: flops 36 x 4 x 7 8064 100.0% 0.0% 0.0% +15: flops 36 x 4 x 7 4032 100.0% 0.0% 0.0% 15: flops 288 x 6 x 3 10368 100.0% 0.0% 0.0% -15: flops 288 x 13 x 3 22464 100.0% 0.0% 0.0% -15: flops inhomo. stacks 204098160 100.0% 0.0% 0.0% -15: flops total 204.177906E+06 100.0% 0.0% 0.0% -15: flops max/rank 58.818472E+06 100.0% 0.0% 0.0% -15: matmuls inhomo. stacks 235 100.0% 0.0% 0.0% +15: flops inhomo. stacks 430519336 100.0% 0.0% 0.0% +15: flops total 430.551946E+06 100.0% 0.0% 0.0% +15: flops max/rank 192.346864E+06 100.0% 0.0% 0.0% +15: matmuls inhomo. stacks 244 100.0% 0.0% 0.0% 15: matmuls total 522 100.0% 0.0% 0.0% -15: number of processed stacks 309 100.0% 0.0% 0.0% -15: average stack size 1.7 0.0 0.0 -15: marketing flops 1.690365E+09 +15: number of processed stacks 124 100.0% 0.0% 0.0% +15: average stack size 4.2 0.0 0.0 +15: marketing flops 1.690366E+09 15: ------------------------------------------------------------------------------- 15: # multiplications 20 -15: max memory usage/rank 117.600256E+06 -15: # max total images/rank 2 +15: max memory usage/rank 92.237824E+06 +15: # max total images/rank 7 15: # max 3D layers 1 -15: # MPI messages exchanged 372 +15: # MPI messages exchanged 42 15: MPI messages size (bytes): -15: total size 3.273920E+06 +15: total size 37.248000E+03 15: min size 0.000000E+00 -15: max size 752.832000E+03 -15: average size 8.800860E+03 +15: max size 2.704000E+03 +15: average size 886.857117E+00 15: MPI breakdown and total messages size (bytes): -15: size <= 128 262 4856 -15: 128 < size <= 8192 56 161880 -15: 8192 < size <= 32768 42 734752 -15: 32768 < size <= 131072 7 419456 -15: 131072 < size <= 4194304 5 1952976 +15: size <= 128 18 480 +15: 128 < size <= 8192 24 36768 +15: 8192 < size <= 32768 0 0 +15: 32768 < size <= 131072 0 0 +15: 131072 < size <= 4194304 0 0 15: 4194304 < size <= 16777216 0 0 15: 16777216 < size 0 0 15: ------------------------------------------------------------------------------- -15: -15: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -15: *** might lead to poor performance. Used ranks: 2 Suggested: 1 4 *** -15: -15: ------------------------------------------------------------------------------- 15: - - 15: - DBCSR MESSAGE PASSING PERFORMANCE - 15: - - 15: ------------------------------------------------------------------------------- 15: ROUTINE CALLS AVE VOLUME [Bytes] -15: MP_Bcast 402 4. -15: MP_Allreduce 687 185245. -15: MP_Alltoall 179 162. -15: MP_ISend 510 4989. -15: MP_IRecv 514 4992. +15: MP_Bcast 398 4. +15: MP_Allreduce 679 187427. +15: MP_Alltoall 176 95. +15: MP_ISend 232 984. +15: MP_IRecv 276 3570. 15: ------------------------------------------------------------------------------- 15: 15: ------------------------------------------------------------------------------- @@ -55708,265 +55711,264 @@ 15: ------------------------------------------------------------------------------- 15: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 15: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -15: dbcsr_t_distribution_new 434 1.7 0.010 0.011 20.108 20.730 0 -15: dbcsr_t_total 96 1.0 0.003 0.009 18.662 18.754 8 -15: dbcsr_t_contract 10 2.0 0.006 0.014 16.228 16.235 0 -15: dbcsr_tas_create_split 382 4.1 0.002 0.002 14.905 15.521 0 -15: dbcsr_tas_create_split_rows_or 382 5.1 0.006 0.006 14.903 15.519 8 -15: dbcsr_tas_multiply 20 4.5 0.000 0.000 14.944 14.959 6 -15: dbcsr_tas_total 20 5.5 0.036 0.382 14.911 14.929 8 -15: dbcsr_tas_distribution_new 492 3.3 0.015 0.019 13.629 13.917 3 -15: dbcsr_t_create_new 217 1.2 0.089 0.491 9.190 9.852 6 -15: mp_cart_create 914 5.3 8.509 9.178 8.509 9.178 11 -15: mp_comm_split_direct 382 6.1 7.225 8.464 7.225 8.464 1 -15: mp_sync 272 3.0 6.531 7.746 6.531 7.746 9 -15: dbcsr_t_pgrid_create 440 2.7 0.004 0.007 7.007 7.719 9 -15: dbcsr_create_new 905 5.9 4.167 4.743 6.444 6.881 7 -15: dbcsr_checksum 40 1.0 1.884 3.096 5.882 6.182 6 -15: mp_comm_dup 372 6.1 5.483 6.157 5.483 6.157 5 -15: dbcsr_tas_dbcsr 20 6.5 0.000 0.000 6.025 6.040 5 -15: dbcsr_tas_result_index 10 5.0 0.001 0.002 5.888 5.908 9 -15: mp_sum_d 137 1.3 3.999 5.731 3.999 5.731 5 -15: dbcsr_multiply_generic 20 8.5 0.044 0.068 3.937 4.425 7 -15: dbcsr_tas_create_new 305 3.6 0.004 0.004 3.120 3.614 6 -15: mp_sum_l 491 4.7 2.154 2.859 2.154 2.859 2 -15: dbcsr_make_index_exist 905 6.9 2.275 2.791 2.275 2.791 8 -15: dbcsr_tas_mm_1N 6 7.5 0.000 0.000 2.046 2.711 8 -15: dbcsr_tas_mm_2 10 7.5 0.000 0.000 2.141 2.148 0 -15: dbcsr_t_copy 101 2.2 0.018 0.038 1.955 2.101 3 -15: reshape_mm_compatible 20 6.5 0.001 0.001 1.979 2.037 0 -15: multiply_cannon 20 9.5 0.195 0.245 1.651 1.929 1 -15: change_split 30 7.0 0.044 0.521 1.780 1.832 3 -15: mp_alltoall_i 139 4.9 1.650 1.786 1.650 1.786 9 -15: mp_bcast_i 394 6.0 0.995 1.710 0.995 1.710 11 -15: make_m2s 40 9.5 0.001 0.001 1.339 1.625 10 -15: make_images 40 10.5 0.288 0.371 1.208 1.444 11 -15: dbcsr_add_anytype 20 6.5 0.128 0.572 1.077 1.302 11 -15: dbcsr_iterator_start 1097 4.3 0.726 1.203 0.727 1.204 0 -15: dbcsr_finalize 968 3.4 0.274 0.331 0.827 1.063 10 -15: dbcsr_t_create_template 91 1.1 0.002 0.002 0.592 1.061 8 -15: multiply_cannon_loop 20 10.5 0.199 0.583 0.896 1.054 11 -15: dbcsr_tas_convert_to_dbcsr 40 1.0 0.132 0.394 0.552 0.867 6 -15: reshape_mm_small 20 6.5 0.004 0.004 0.832 0.861 9 -15: dbcsr_merge_all 39 9.7 0.369 0.481 0.530 0.824 4 -15: mp_waitall_1 604 13.0 0.393 0.815 0.393 0.815 9 -15: setup_buffer_matrices 40 10.5 0.035 0.419 0.300 0.744 10 -15: dbcsr_tas_mm_3T 4 7.5 0.000 0.000 0.548 0.694 0 -15: dbcsr_tas_reshape 24 6.7 0.001 0.001 0.548 0.611 4 -15: multiply_cannon_metrocomm1 40 11.5 0.000 0.000 0.288 0.588 3 -15: dbcsr_sort_data 38 11.7 0.101 0.580 0.101 0.580 3 -15: buffer_matrices_ensure_size 40 10.5 0.087 0.540 0.087 0.540 0 -15: dbcsr_reserve_blocks 512 4.7 0.125 0.538 0.126 0.538 7 -15: dbcsr_tas_reserve_blocks_index 452 3.9 0.002 0.003 0.119 0.527 0 -15: dbcsr_tas_copy 17 6.3 0.143 0.438 0.280 0.517 3 -15: make_images_sizes 40 11.5 0.000 0.000 0.337 0.515 10 -15: mp_alltoall_i44 40 12.5 0.337 0.515 0.337 0.515 0 -15: dbcsr_t_reserve_blocks_index 391 2.3 0.002 0.002 0.113 0.511 3 -15: dbcsr_scale_anytype 46 6.7 0.086 0.109 0.393 0.493 7 -15: dbcsr_t_remap 15 3.0 0.003 0.003 0.460 0.473 0 -15: dbcsr_tas_replicate 20 6.5 0.001 0.001 0.420 0.458 0 -15: convert_to_new_pgrid 60 6.5 0.000 0.000 0.365 0.438 5 -15: mp_max_lv 30 5.0 0.074 0.419 0.074 0.419 3 -15: dbcsr_tas_reshape_alltoall 24 7.7 0.000 0.000 0.340 0.407 0 -15: dbcsr_t_reserve_blocks_index_a 189 2.7 0.001 0.001 0.061 0.383 4 -15: dbcsr_t_reserve_blocks_templat 89 1.1 0.001 0.001 0.042 0.378 0 -15: mp_sum_dm4 7 1.0 0.340 0.366 0.340 0.366 1 -15: calculate_norms 80 11.5 0.247 0.344 0.247 0.344 1 -15: dbcsr_data_release 2690 6.9 0.031 0.333 0.031 0.333 0 -15: make_images_data 40 11.5 0.001 0.001 0.279 0.328 0 -15: dbcsr_copy 80 8.5 0.094 0.114 0.264 0.328 8 -15: hybrid_alltoall_any 40 12.5 0.112 0.181 0.247 0.311 6 -15: mp_sum_dm3 29 1.0 0.275 0.308 0.275 0.308 7 -15: mp_allgather_i34 20 10.5 0.106 0.211 0.106 0.211 0 -15: mp_waitall_2 261 6.1 0.140 0.209 0.140 0.209 3 -15: dbcsr_tas_merge 10 6.5 0.001 0.001 0.181 0.198 0 -15: dbcsr_filter_anytype 40 5.8 0.027 0.040 0.164 0.198 9 -15: mp_max_iv 75 3.8 0.172 0.195 0.172 0.195 1 -15: dbcsr_tas_replicate_alltoall 10 7.5 0.000 0.000 0.135 0.193 0 -15: mp_max_l 159 1.1 0.126 0.187 0.126 0.187 9 -15: dbcsr_special_finalize 49 11.2 0.033 0.054 0.114 0.183 11 -15: multiply_cannon_metrocomm3 40 11.5 0.000 0.000 0.063 0.179 0 -15: dbcsr_tas_reshape_buffer_fill 24 7.7 0.001 0.001 0.121 0.159 9 -15: dbcsr_t_communicate_buffer 95 3.3 0.001 0.002 0.068 0.158 3 -15: dbcsr_iterator_stop 1097 4.3 0.119 0.155 0.119 0.156 10 -15: mp_max_i 94 1.4 0.120 0.153 0.120 0.153 2 -15: dbcsr_make_index_list 49 10.2 0.104 0.141 0.104 0.141 11 -15: dbcsr_merge_single_wm 18 11.0 0.051 0.082 0.079 0.128 11 -15: multiply_cannon_multrec 40 11.5 0.092 0.122 0.098 0.126 11 -15: dbcsr_new_transposed 14 9.5 0.002 0.005 0.093 0.122 10 -15: dbcsr_tas_communicate_buffer 44 8.6 0.001 0.001 0.076 0.107 0 -15: dbcsr_destroy 865 5.0 0.011 0.097 0.013 0.099 6 -15: mp_sum_i 21 7.2 0.058 0.099 0.058 0.099 4 -15: dbcsr_t_nd_mp_comm 15 4.0 0.000 0.000 0.086 0.098 7 -15: dbcsr_tas_merge_alltoall 10 7.5 0.000 0.000 0.063 0.082 6 -15: setup_rec_index_2d 40 10.5 0.060 0.082 0.060 0.082 11 -15: dbcsr_add_wm_from_matrix 10 8.0 0.036 0.057 0.046 0.076 11 -15: dbcsr_tas_mp_comm 14 4.4 0.000 0.000 0.059 0.072 9 -15: merge_index 39 10.7 0.057 0.070 0.057 0.070 2 -15: dbcsr_make_untransposed_blocks 30 9.0 0.051 0.065 0.051 0.065 11 -15: dbcsr_tas_replicate_communicat 10 7.5 0.000 0.000 0.036 0.048 8 -15: mp_sum_dm 4 1.0 0.042 0.045 0.042 0.045 5 -15: dbcsr_make_index_local_row 49 10.2 0.027 0.044 0.027 0.044 7 -15: dbcsr_tas_merge_communicate_bu 10 7.5 0.000 0.000 0.016 0.043 9 -15: dbcsr_data_new 1359 7.7 0.006 0.042 0.006 0.042 6 -15: dbcsr_get_data_size_used 39 9.7 0.022 0.035 0.022 0.035 9 -15: dbcsr_tas_reshape_communicate_ 24 7.7 0.000 0.000 0.024 0.034 1 -15: mp_comm_free 1784 3.8 0.013 0.028 0.013 0.028 5 -15: dbcsr_fill_wm_from_matrix 10 9.0 0.010 0.023 0.010 0.023 7 -15: dbcsr_t_destroy 338 1.3 0.004 0.004 0.010 0.019 7 -15: dbcsr_tas_reshape_buffer_obtai 24 7.7 0.001 0.001 0.006 0.019 9 -15: dbcsr_mm_multrec_init 20 10.5 0.000 0.000 0.003 0.012 5 -15: dbcsr_mm_csr_init 20 11.5 0.003 0.012 0.003 0.012 9 -15: mp_sum_iv 20 10.5 0.003 0.012 0.003 0.012 0 -15: multiply_cannon_multrec_finali 20 12.5 0.000 0.000 0.005 0.012 1 -15: dbcsr_mm_multrec_finalize 20 13.5 0.005 0.011 0.005 0.012 5 -15: dbcsr_t_copy_nocomm 3 3.0 0.000 0.001 0.005 0.011 3 -15: quick_finalize 31 12.9 0.003 0.009 0.003 0.009 6 -15: dbcsr_t_distribution_destroy 434 1.7 0.002 0.002 0.005 0.009 6 -15: mp_cart_sub 116 12.2 0.003 0.007 0.003 0.007 6 -15: dbcsr_work_destroy_all 88 11.2 0.000 0.000 0.001 0.005 6 -15: mp_isend_dv 230 8.8 0.001 0.003 0.001 0.003 6 -15: dbcsr_init_lib_low 1 1.0 0.001 0.002 0.001 0.002 9 -15: dbcsr_distribution_new 586 4.6 0.002 0.002 0.002 0.002 1 -15: dbcsr_t_align_index 30 3.0 0.000 0.000 0.001 0.002 9 -15: dbcsr_sort_indices 1011 6.2 0.001 0.002 0.001 0.002 0 -15: mp_maxloc_dv 327 1.0 0.002 0.002 0.002 0.002 7 -15: dbcsr_t_permute_index 30 4.0 0.001 0.002 0.001 0.002 0 -15: mp_bcast_av 163 1.0 0.001 0.001 0.001 0.001 5 -15: dbcsr_iterator_seek 1097 5.3 0.001 0.001 0.001 0.001 0 -15: mp_isend_lm2 85 9.3 0.001 0.001 0.001 0.001 1 -15: mp_irecv_lm2 75 9.3 0.000 0.001 0.000 0.001 4 -15: dbcsr_work_create 88 10.3 0.000 0.000 0.001 0.001 3 -15: make_images_pack 40 11.5 0.000 0.000 0.000 0.000 3 -15: mp_irecv_dv 224 8.8 0.000 0.000 0.000 0.000 9 -15: dbcsr_make_dbcsr_index 581 7.2 0.000 0.000 0.000 0.000 0 -15: multiply_cannon_metrocomm4 18 11.7 0.000 0.000 0.000 0.000 8 -15: mp_sum_lv 20 1.0 0.000 0.000 0.000 0.000 0 -15: dbcsr_switch_data_area 85 11.8 0.000 0.000 0.000 0.000 6 -15: multiply_cannon_metrocomm2 13 12.3 0.000 0.000 0.000 0.000 10 +15: dbcsr_t_total 96 1.0 0.002 0.004 2.947 3.004 1 +15: dbcsr_t_contract 10 2.0 0.006 0.012 2.042 2.045 0 +15: dbcsr_t_distribution_new 434 1.7 0.012 0.013 1.549 1.922 2 +15: mp_cart_create 898 5.2 1.394 1.729 1.394 1.729 6 +15: dbcsr_t_pgrid_create 440 2.7 0.004 0.005 1.374 1.706 6 +15: dbcsr_tas_multiply 20 4.5 0.000 0.000 1.647 1.656 3 +15: dbcsr_tas_total 20 5.5 0.004 0.008 1.646 1.655 0 +15: mp_sync 272 3.0 1.318 1.517 1.318 1.517 6 +15: mp_sum_dm4 7 1.0 1.267 1.352 1.267 1.352 3 +15: dbcsr_create_new 859 5.8 0.670 1.070 0.690 1.082 4 +15: mp_alltoall_i 136 4.9 0.924 1.019 0.924 1.019 0 +15: dbcsr_t_create_new 217 1.2 0.009 0.013 0.617 0.909 1 +15: dbcsr_t_copy 101 2.2 0.022 0.061 0.805 0.895 3 +15: dbcsr_tas_result_index 10 5.0 0.002 0.003 0.738 0.741 6 +15: dbcsr_tas_create_new 289 3.4 0.007 0.007 0.409 0.708 5 +15: mp_sum_dm3 29 1.0 0.280 0.432 0.280 0.432 6 +15: mp_sum_l 491 4.7 0.380 0.419 0.380 0.419 2 +15: dbcsr_checksum 40 1.0 0.013 0.032 0.327 0.394 6 +15: mp_sum_d 137 1.3 0.315 0.383 0.315 0.383 0 +15: dbcsr_tas_dbcsr 20 6.5 0.000 0.000 0.325 0.336 2 +15: dbcsr_tas_distribution_new 476 3.1 0.033 0.043 0.222 0.283 1 +15: dbcsr_tas_create_split 382 4.1 0.003 0.004 0.212 0.265 6 +15: dbcsr_tas_create_split_rows_or 382 5.1 0.008 0.008 0.209 0.262 5 +15: dbcsr_tas_reshape 21 6.9 0.001 0.001 0.212 0.238 5 +15: mp_comm_dup 372 6.1 0.166 0.220 0.166 0.220 1 +15: dbcsr_multiply_generic 20 8.5 0.003 0.003 0.151 0.205 6 +15: dbcsr_tas_reshape_alltoall 21 7.9 0.000 0.000 0.150 0.184 3 +15: mp_max_l 158 1.1 0.098 0.176 0.098 0.176 6 +15: dbcsr_t_remap 15 3.0 0.004 0.004 0.155 0.169 3 +15: dbcsr_tas_replicate 20 6.5 0.002 0.002 0.139 0.164 6 +15: reshape_mm_small 20 6.5 0.004 0.005 0.125 0.148 3 +15: dbcsr_tas_merge 10 6.5 0.001 0.001 0.115 0.123 2 +15: mp_waitall_2 243 7.0 0.101 0.122 0.101 0.122 6 +15: multiply_cannon 20 9.5 0.019 0.051 0.064 0.120 4 +15: dbcsr_tas_communicate_buffer 41 8.7 0.001 0.001 0.090 0.117 6 +15: dbcsr_tas_mm_2 10 7.5 0.000 0.000 0.108 0.110 3 +15: dbcsr_iterator_start 1063 4.2 0.062 0.103 0.064 0.105 3 +15: dbcsr_scale_anytype 46 6.8 0.001 0.002 0.059 0.099 6 +15: dbcsr_tas_replicate_alltoall 10 7.5 0.000 0.000 0.076 0.098 3 +15: dbcsr_tas_mm_1N 6 7.5 0.000 0.000 0.079 0.096 5 +15: dbcsr_tas_convert_to_dbcsr 40 1.0 0.004 0.011 0.054 0.076 6 +15: make_m2s 40 9.5 0.002 0.004 0.054 0.075 1 +15: make_images 40 10.5 0.011 0.022 0.051 0.072 6 +15: dbcsr_add_anytype 20 6.5 0.001 0.004 0.033 0.071 3 +15: dbcsr_tas_merge_alltoall 10 7.5 0.000 0.000 0.056 0.071 3 +15: dbcsr_t_nd_mp_comm 15 4.0 0.000 0.000 0.047 0.060 2 +15: multiply_cannon_loop 20 10.5 0.004 0.017 0.033 0.052 1 +15: dbcsr_tas_reshape_communicate_ 21 7.9 0.000 0.000 0.035 0.051 5 +15: dbcsr_t_reserve_blocks_index 391 2.3 0.003 0.004 0.021 0.049 3 +15: dbcsr_tas_mm_3T 4 7.5 0.000 0.000 0.024 0.049 4 +15: dbcsr_reserve_blocks 496 4.6 0.023 0.046 0.023 0.048 3 +15: dbcsr_tas_reshape_buffer_fill 21 7.9 0.001 0.001 0.023 0.047 2 +15: dbcsr_tas_reserve_blocks_index 436 3.7 0.004 0.006 0.019 0.046 3 +15: convert_to_new_pgrid 60 6.5 0.000 0.000 0.024 0.046 6 +15: reshape_mm_compatible 20 6.5 0.001 0.001 0.041 0.044 0 +15: dbcsr_tas_replicate_communicat 10 7.5 0.000 0.000 0.033 0.043 2 +15: mp_max_i 90 1.4 0.035 0.041 0.035 0.041 4 +15: multiply_cannon_multrec 26 11.2 0.012 0.035 0.018 0.036 4 +15: dbcsr_finalize 963 3.3 0.015 0.029 0.021 0.033 1 +15: dbcsr_t_reserve_blocks_index_a 189 2.7 0.001 0.001 0.013 0.032 0 +15: dbcsr_tas_merge_communicate_bu 10 7.5 0.000 0.000 0.021 0.031 3 +15: change_split 30 7.0 0.000 0.000 0.028 0.031 0 +15: dbcsr_make_index_exist 859 6.8 0.019 0.031 0.019 0.031 5 +15: dbcsr_new_transposed 14 9.5 0.000 0.000 0.014 0.029 2 +15: dbcsr_filter_anytype 37 5.9 0.001 0.002 0.015 0.029 2 +15: make_images_data 40 11.5 0.001 0.002 0.019 0.029 6 +15: dbcsr_t_communicate_buffer 95 3.3 0.002 0.004 0.018 0.027 2 +15: hybrid_alltoall_any 40 12.5 0.005 0.010 0.017 0.026 6 +15: dbcsr_t_create_template 91 1.1 0.002 0.002 0.012 0.026 0 +15: mp_comm_split_direct 382 6.1 0.018 0.021 0.018 0.021 0 +15: mp_sum_dm 4 1.0 0.017 0.021 0.017 0.021 6 +15: multiply_cannon_multrec_finali 20 12.5 0.000 0.000 0.006 0.019 2 +15: dbcsr_mm_multrec_finalize 20 13.5 0.006 0.019 0.006 0.019 1 +15: dbcsr_t_destroy 338 1.3 0.005 0.005 0.012 0.017 1 +15: dbcsr_t_reserve_blocks_templat 89 1.1 0.002 0.002 0.007 0.016 3 +15: make_images_sizes 40 11.5 0.000 0.000 0.011 0.015 0 +15: mp_alltoall_i44 40 12.5 0.011 0.015 0.011 0.015 4 +15: mp_max_iv 75 3.8 0.010 0.015 0.010 0.015 2 +15: mp_waitall_1 504 12.9 0.008 0.015 0.008 0.015 0 +15: multiply_cannon_metrocomm1 26 11.2 0.000 0.000 0.008 0.014 4 +15: dbcsr_destroy 819 4.9 0.004 0.004 0.009 0.013 0 +15: dbcsr_merge_all 40 9.7 0.004 0.011 0.005 0.012 3 +15: mp_bcast_i 394 6.0 0.004 0.012 0.004 0.012 3 +15: dbcsr_data_release 2598 6.8 0.007 0.011 0.007 0.011 3 +15: mp_comm_free 1736 3.8 0.010 0.011 0.010 0.011 0 +15: dbcsr_copy 80 8.5 0.002 0.007 0.006 0.011 6 +15: dbcsr_iterator_stop 1063 4.2 0.005 0.009 0.007 0.011 4 +15: dbcsr_special_finalize 46 11.3 0.000 0.000 0.004 0.010 6 +15: dbcsr_mm_multrec_init 20 10.5 0.000 0.000 0.003 0.009 0 +15: dbcsr_mm_csr_init 20 11.5 0.003 0.009 0.003 0.009 4 +15: dbcsr_tas_copy 4 4.0 0.001 0.001 0.003 0.008 5 +15: dbcsr_t_copy_nocomm 3 3.0 0.000 0.001 0.003 0.008 3 +15: mp_sum_i 21 7.2 0.004 0.008 0.004 0.008 6 +15: calculate_norms 52 11.2 0.002 0.008 0.002 0.008 1 +15: dbcsr_merge_single_wm 7 11.0 0.002 0.008 0.002 0.008 1 +15: mp_allgather_i34 20 10.5 0.005 0.008 0.005 0.008 4 +15: dbcsr_init_lib_low 1 1.0 0.004 0.007 0.004 0.007 3 +15: dbcsr_t_distribution_destroy 434 1.7 0.003 0.004 0.006 0.007 4 +15: mp_isend_dv 189 8.2 0.002 0.006 0.002 0.006 3 +15: dbcsr_tas_reshape_buffer_obtai 21 7.9 0.001 0.001 0.002 0.006 1 +15: setup_rec_index_2d 40 10.5 0.001 0.004 0.001 0.004 4 +15: setup_buffer_matrices 40 10.5 0.000 0.000 0.002 0.004 0 +15: dbcsr_data_new 1296 7.7 0.003 0.003 0.003 0.003 6 +15: mp_maxloc_dv 325 1.0 0.003 0.003 0.003 0.003 5 +15: dbcsr_tas_mp_comm 14 4.4 0.000 0.000 0.002 0.003 5 +15: dbcsr_sort_indices 963 6.7 0.001 0.003 0.001 0.003 3 +15: mp_bcast_av 162 1.0 0.001 0.001 0.002 0.002 2 +15: dbcsr_distribution_new 570 4.5 0.002 0.002 0.002 0.002 1 +15: dbcsr_iterator_seek 1063 5.2 0.002 0.002 0.002 0.002 3 +15: quick_finalize 39 12.5 0.001 0.001 0.001 0.002 6 +15: dbcsr_make_untransposed_blocks 30 9.0 0.001 0.001 0.001 0.002 2 +15: dbcsr_add_wm_from_matrix 10 8.0 0.000 0.000 0.001 0.001 0 +15: dbcsr_sort_data 27 11.6 0.001 0.001 0.001 0.001 6 +15: dbcsr_work_destroy_all 86 11.2 0.000 0.001 0.001 0.001 6 +15: make_images_pack 40 11.5 0.000 0.000 0.001 0.001 6 +15: dbcsr_fill_wm_from_matrix 10 9.0 0.000 0.001 0.000 0.001 2 +15: dbcsr_t_align_index 30 3.0 0.000 0.000 0.001 0.001 3 +15: mp_cart_sub 84 12.6 0.001 0.001 0.001 0.001 6 +15: dbcsr_work_create 86 10.4 0.001 0.001 0.001 0.001 6 +15: dbcsr_make_dbcsr_index 554 7.9 0.000 0.001 0.000 0.001 3 +15: dbcsr_make_index_list 46 10.3 0.001 0.001 0.001 0.001 6 +15: dbcsr_t_permute_index 30 4.0 0.001 0.001 0.001 0.001 0 +15: dbcsr_switch_data_area 93 11.8 0.000 0.000 0.000 0.001 1 +15: dbcsr_make_index_local_row 46 10.3 0.000 0.000 0.000 0.000 2 +15: block_buffer_get_index 287 8.2 0.000 0.000 0.000 0.000 2 +15: mp_sum_lv 16 1.0 0.000 0.000 0.000 0.000 0 +15: mp_max_lv 30 5.0 0.000 0.000 0.000 0.000 3 +15: merge_index 40 10.7 0.000 0.000 0.000 0.000 2 +15: mp_isend_im2 106 4.7 0.000 0.000 0.000 0.000 3 +15: dbcsr_tas_reshape_get_coord 21 7.9 0.000 0.000 0.000 0.000 0 +15: mp_irecv_dv 196 8.2 0.000 0.000 0.000 0.000 5 +15: mp_isend_lm2 115 9.7 0.000 0.000 0.000 0.000 6 +15: mp_irecv_im2 102 4.7 0.000 0.000 0.000 0.000 3 +15: mp_dims_create 79 5.3 0.000 0.000 0.000 0.000 3 +15: dbcsr_tas_blk_sizes 161 8.0 0.000 0.000 0.000 0.000 5 +15: dbcsr_data_copy_aa2 13 9.4 0.000 0.000 0.000 0.000 2 +15: dbcsr_index_compact 37 6.9 0.000 0.000 0.000 0.000 0 +15: transpose_index_local 14 10.5 0.000 0.000 0.000 0.000 6 15: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 5 -15: mp_isend_iv 121 12.6 0.000 0.000 0.000 0.000 0 -15: mp_isend_im2 98 4.4 0.000 0.000 0.000 0.000 5 -15: block_buffer_get_index 528 8.1 0.000 0.000 0.000 0.000 11 -15: mp_irecv_im2 102 4.4 0.000 0.000 0.000 0.000 1 -15: dbcsr_tas_reshape_get_coord 24 7.7 0.000 0.000 0.000 0.000 7 -15: dbcsr_index_compact 40 6.8 0.000 0.000 0.000 0.000 6 -15: transpose_index_local 14 10.5 0.000 0.000 0.000 0.000 11 -15: mp_dims_create 115 5.3 0.000 0.000 0.000 0.000 5 -15: mp_irecv_iv 119 12.6 0.000 0.000 0.000 0.000 0 -15: fill_hash_tables 20 12.5 0.000 0.000 0.000 0.000 6 -15: mp_bcast_iv 20 1.0 0.000 0.000 0.000 0.000 6 -15: dbcsr_tas_blk_sizes 89 7.7 0.000 0.000 0.000 0.000 7 -15: dbcsr_get_local_rows 20 9.5 0.000 0.000 0.000 0.000 5 -15: dbcsr_mm_sched_init 20 12.5 0.000 0.000 0.000 0.000 9 -15: dbcsr_get_local_cols 20 9.5 0.000 0.000 0.000 0.000 8 -15: dbcsr_data_copy_aa2 9 9.3 0.000 0.000 0.000 0.000 4 +15: mp_irecv_lm2 103 9.7 0.000 0.000 0.000 0.000 0 +15: mp_isend_iv 86 12.4 0.000 0.000 0.000 0.000 3 +15: multiply_cannon_metrocomm2 6 10.0 0.000 0.000 0.000 0.000 3 +15: mp_irecv_iv 86 12.4 0.000 0.000 0.000 0.000 6 +15: mp_bcast_iv 16 1.0 0.000 0.000 0.000 0.000 6 +15: dbcsr_get_data_size_used 40 9.7 0.000 0.000 0.000 0.000 3 +15: fill_hash_tables 20 12.5 0.000 0.000 0.000 0.000 3 +15: dbcsr_mm_sched_init 20 12.5 0.000 0.000 0.000 0.000 6 +15: buffer_matrices_ensure_size 40 10.5 0.000 0.000 0.000 0.000 5 +15: dbcsr_get_local_rows 20 9.5 0.000 0.000 0.000 0.000 0 +15: dbcsr_get_local_cols 20 9.5 0.000 0.000 0.000 0.000 6 15: dbcsr_mm_sched_finalize 20 14.5 0.000 0.000 0.000 0.000 0 -15: dbcsr_get_global_row_map 20 9.5 0.000 0.000 0.000 0.000 8 -15: multrec_filtering 20 14.5 0.000 0.000 0.000 0.000 8 -15: dbcsr_get_global_col_map 20 9.5 0.000 0.000 0.000 0.000 3 -15: dbcsr_mm_hostdrv_init 20 13.5 0.000 0.000 0.000 0.000 5 -15: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 4 -15: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 4 -15: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 4 -15: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 3 -15: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 0 -15: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 4 +15: dbcsr_get_global_row_map 20 9.5 0.000 0.000 0.000 0.000 0 +15: multrec_filtering 20 14.5 0.000 0.000 0.000 0.000 5 +15: multiply_cannon_metrocomm3 26 11.2 0.000 0.000 0.000 0.000 0 +15: mp_sum_iv 20 10.5 0.000 0.000 0.000 0.000 0 +15: dbcsr_get_global_col_map 20 9.5 0.000 0.000 0.000 0.000 0 +15: dbcsr_mm_hostdrv_init 20 13.5 0.000 0.000 0.000 0.000 0 +15: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 6 +15: mp_max_d 1 1.0 0.000 0.000 0.000 0.000 0 +15: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 5 +15: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 3 +15: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 5 +15: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 6 15: ------------------------------------------------------------------------------- 15: -15/19 Test #15: dbcsr_tensor_unittest ................................. Passed 54.72 sec +15/19 Test #15: dbcsr_tensor_unittest ................................. Passed 12.20 sec test 16 Start 16: dbcsr_tas_unittest -16: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_tas_unittest" +16: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_tas_unittest" 16: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 16: Environment variables: 16: OMP_NUM_THREADS=2 16: Test timeout computed to be: 1500 16: DBCSR TALL-AND-SKINNY MATRICES 16: Split info for matrix A 100 X 20 -16: Asplitting rows by factor 3 -16: Aglobal grid sizes: 6x 2 -16: Agrid sizes on subgroups: 2x 2 +16: Asplitting rows by factor 7 +16: Aglobal grid sizes: 7x 1 +16: Agrid sizes on subgroups: 1x 1 16: Split info for matrix A^t 20 X 100 -16: Atsplitting columns by factor 3 -16: Atglobal grid sizes: 2x 6 -16: Atgrid sizes on subgroups: 2x 2 +16: Atsplitting columns by factor 7 +16: Atglobal grid sizes: 1x 7 +16: Atgrid sizes on subgroups: 1x 1 16: Split info for matrix B 10 X 100 -16: Bsplitting columns by factor 12 -16: Bglobal grid sizes: 1x 12 +16: Bsplitting columns by factor 7 +16: Bglobal grid sizes: 1x 7 16: Bgrid sizes on subgroups: 1x 1 16: Split info for matrix B^t 100 X 10 -16: Btsplitting rows by factor 12 -16: Btglobal grid sizes: 12x 1 +16: Btsplitting rows by factor 7 +16: Btglobal grid sizes: 7x 1 16: Btgrid sizes on subgroups: 1x 1 16: Split info for matrix C 20 X 10 -16: Csplitting rows by factor 3 -16: Cglobal grid sizes: 6x 2 -16: Cgrid sizes on subgroups: 2x 2 +16: Csplitting rows by factor 1 +16: Cglobal grid sizes: 1x 7 +16: Cgrid sizes on subgroups: 1x 7 16: Split info for matrix C^t 10 X 20 -16: Ctsplitting columns by factor 3 -16: Ctglobal grid sizes: 2x 6 -16: Ctgrid sizes on subgroups: 2x 2 +16: Ctsplitting columns by factor 1 +16: Ctglobal grid sizes: 7x 1 +16: Ctgrid sizes on subgroups: 7x 1 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: B x A = C^t 16: -------------------------------------------------------------------------------- 16: mm dims: 10 100 20 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 7094 +16: Est. number of matrix elements per CPU of result matrix: 12160 16: Est. optimal split factor: 1 16: Optimizing distribution of B and A 16: mm case: |T x | = + 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 1 +16: global grid sizes: 1x 7 +16: grid sizes on subgroups: 1x 7 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF C^t 16: block dimensions: 10 20 16: full dimensions: 270 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: Change process grid: No 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 91 16: Percentage of non-zero blocks: 9.10 -16: Average number of blocks per group: 31 -16: Maximum number of blocks per group: 35 -16: Average number of matrix elements per group: 9626 -16: Maximum number of matrix elements per group: 10560 -16: Average number of blocks per CPU: 8 -16: Maximum number of blocks per CPU: 10 -16: Average number of matrix elements per CPU: 2407 -16: Maximum number of matrix elements per CPU: 4797 +16: Average number of blocks per group: 91 +16: Maximum number of blocks per group: 91 +16: Average number of matrix elements per group: 28878 +16: Maximum number of matrix elements per group: 28878 +16: Average number of blocks per CPU: 13 +16: Maximum number of blocks per CPU: 21 +16: Average number of matrix elements per CPU: 4126 +16: Maximum number of matrix elements per CPU: 15462 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 207 16: Percentage of non-zero blocks: 10.35 -16: Average number of blocks per group: 69 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 21835 -16: Maximum number of matrix elements per group: 25054 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5459 -16: Maximum number of matrix elements per CPU: 7226 +16: Average number of blocks per group: 207 +16: Maximum number of blocks per group: 207 +16: Average number of matrix elements per group: 65504 +16: Maximum number of matrix elements per group: 65504 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 41 +16: Average number of matrix elements per CPU: 9358 +16: Maximum number of matrix elements per CPU: 15279 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 147 -16: Percentage of non-zero blocks: 24.50 -16: Average number of blocks per group: 49 -16: Maximum number of blocks per group: 64 -16: Average number of matrix elements per group: 38358 -16: Maximum number of matrix elements per group: 43740 -16: Average number of blocks per CPU: 13 -16: Maximum number of blocks per CPU: 32 -16: Average number of matrix elements per CPU: 9590 -16: Maximum number of matrix elements per CPU: 19881 +16: Number of non-zero blocks: 113 +16: Percentage of non-zero blocks: 56.50 +16: Average number of blocks per group: 113 +16: Maximum number of blocks per group: 113 +16: Average number of matrix elements per group: 85119 +16: Maximum number of matrix elements per group: 85119 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 25 +16: Average number of matrix elements per CPU: 12160 +16: Maximum number of matrix elements per CPU: 21993 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -55978,125 +55980,125 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 10 100 20 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 7451 +16: Est. number of matrix elements per CPU of result matrix: 12773 16: Est. optimal split factor: 1 16: Optimizing distribution of B^t and A 16: mm case: |T x | = + 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 1 +16: global grid sizes: 1x 7 +16: grid sizes on subgroups: 1x 7 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF C^t 16: block dimensions: 10 20 16: full dimensions: 270 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: Change process grid: No 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 114 16: Percentage of non-zero blocks: 11.40 -16: Average number of blocks per group: 38 -16: Maximum number of blocks per group: 41 -16: Average number of matrix elements per group: 11419 -16: Maximum number of matrix elements per group: 12123 -16: Average number of blocks per CPU: 10 -16: Maximum number of blocks per CPU: 16 -16: Average number of matrix elements per CPU: 2855 -16: Maximum number of matrix elements per CPU: 6228 +16: Average number of blocks per group: 114 +16: Maximum number of blocks per group: 114 +16: Average number of matrix elements per group: 34257 +16: Maximum number of matrix elements per group: 34257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 27 +16: Average number of matrix elements per CPU: 4894 +16: Maximum number of matrix elements per CPU: 12750 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 207 16: Percentage of non-zero blocks: 10.35 -16: Average number of blocks per group: 69 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 21835 -16: Maximum number of matrix elements per group: 25054 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5459 -16: Maximum number of matrix elements per CPU: 7226 +16: Average number of blocks per group: 207 +16: Maximum number of blocks per group: 207 +16: Average number of matrix elements per group: 65504 +16: Maximum number of matrix elements per group: 65504 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 41 +16: Average number of matrix elements per CPU: 9358 +16: Maximum number of matrix elements per CPU: 15279 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 183 -16: Percentage of non-zero blocks: 30.50 -16: Average number of blocks per group: 61 -16: Maximum number of blocks per group: 66 -16: Average number of matrix elements per group: 35466 -16: Maximum number of matrix elements per group: 38577 -16: Average number of blocks per CPU: 16 -16: Maximum number of blocks per CPU: 29 -16: Average number of matrix elements per CPU: 8867 -16: Maximum number of matrix elements per CPU: 16137 +16: Number of non-zero blocks: 131 +16: Percentage of non-zero blocks: 65.50 +16: Average number of blocks per group: 131 +16: Maximum number of blocks per group: 131 +16: Average number of matrix elements per group: 89406 +16: Maximum number of matrix elements per group: 89406 +16: Average number of blocks per CPU: 19 +16: Maximum number of blocks per CPU: 25 +16: Average number of matrix elements per CPU: 12773 +16: Maximum number of matrix elements per CPU: 15633 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: B^tT X AN passed! 16: checksums 0.27E+07 0.27E+07 -16: difference norm 0.18E-13 +16: difference norm 0.21E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: B x A^t = C^t 16: -------------------------------------------------------------------------------- 16: mm dims: 10 100 20 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 7400 +16: Est. number of matrix elements per CPU of result matrix: 12686 16: Est. optimal split factor: 1 16: Optimizing distribution of B and A^t 16: mm case: |T x | = + 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 1 +16: global grid sizes: 1x 7 +16: grid sizes on subgroups: 1x 7 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF C^t 16: block dimensions: 10 20 16: full dimensions: 270 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: Change process grid: No 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 91 16: Percentage of non-zero blocks: 9.10 -16: Average number of blocks per group: 31 -16: Maximum number of blocks per group: 35 -16: Average number of matrix elements per group: 9626 -16: Maximum number of matrix elements per group: 10560 -16: Average number of blocks per CPU: 8 -16: Maximum number of blocks per CPU: 10 -16: Average number of matrix elements per CPU: 2407 -16: Maximum number of matrix elements per CPU: 4797 +16: Average number of blocks per group: 91 +16: Maximum number of blocks per group: 91 +16: Average number of matrix elements per group: 28878 +16: Maximum number of matrix elements per group: 28878 +16: Average number of blocks per CPU: 13 +16: Maximum number of blocks per CPU: 21 +16: Average number of matrix elements per CPU: 4126 +16: Maximum number of matrix elements per CPU: 15462 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 208 16: Percentage of non-zero blocks: 10.40 -16: Average number of blocks per group: 70 -16: Maximum number of blocks per group: 72 -16: Average number of matrix elements per group: 25149 -16: Maximum number of matrix elements per group: 29364 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 24 -16: Average number of matrix elements per CPU: 6288 -16: Maximum number of matrix elements per CPU: 11811 +16: Average number of blocks per group: 208 +16: Maximum number of blocks per group: 208 +16: Average number of matrix elements per group: 75445 +16: Maximum number of matrix elements per group: 75445 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 41 +16: Average number of matrix elements per CPU: 10778 +16: Maximum number of matrix elements per CPU: 24390 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 170 -16: Percentage of non-zero blocks: 28.33 -16: Average number of blocks per group: 57 -16: Maximum number of blocks per group: 64 -16: Average number of matrix elements per group: 43311 -16: Maximum number of matrix elements per group: 46860 -16: Average number of blocks per CPU: 15 -16: Maximum number of blocks per CPU: 27 -16: Average number of matrix elements per CPU: 10828 -16: Maximum number of matrix elements per CPU: 20892 +16: Number of non-zero blocks: 125 +16: Percentage of non-zero blocks: 62.50 +16: Average number of blocks per group: 125 +16: Maximum number of blocks per group: 125 +16: Average number of matrix elements per group: 88797 +16: Maximum number of matrix elements per group: 88797 +16: Average number of blocks per CPU: 18 +16: Maximum number of blocks per CPU: 28 +16: Average number of matrix elements per CPU: 12686 +16: Maximum number of matrix elements per CPU: 17469 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -56108,190 +56110,190 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 10 100 20 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 7520 +16: Est. number of matrix elements per CPU of result matrix: 12891 16: Est. optimal split factor: 1 16: Optimizing distribution of B^t and A^t 16: mm case: |T x | = + 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 1 +16: global grid sizes: 1x 7 +16: grid sizes on subgroups: 1x 7 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF C^t 16: block dimensions: 10 20 16: full dimensions: 270 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: Change process grid: No 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 114 16: Percentage of non-zero blocks: 11.40 -16: Average number of blocks per group: 38 -16: Maximum number of blocks per group: 41 -16: Average number of matrix elements per group: 11419 -16: Maximum number of matrix elements per group: 12123 -16: Average number of blocks per CPU: 10 -16: Maximum number of blocks per CPU: 16 -16: Average number of matrix elements per CPU: 2855 -16: Maximum number of matrix elements per CPU: 6228 +16: Average number of blocks per group: 114 +16: Maximum number of blocks per group: 114 +16: Average number of matrix elements per group: 34257 +16: Maximum number of matrix elements per group: 34257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 27 +16: Average number of matrix elements per CPU: 4894 +16: Maximum number of matrix elements per CPU: 12750 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 208 16: Percentage of non-zero blocks: 10.40 -16: Average number of blocks per group: 70 -16: Maximum number of blocks per group: 72 -16: Average number of matrix elements per group: 25149 -16: Maximum number of matrix elements per group: 29364 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 24 -16: Average number of matrix elements per CPU: 6288 -16: Maximum number of matrix elements per CPU: 11811 +16: Average number of blocks per group: 208 +16: Maximum number of blocks per group: 208 +16: Average number of matrix elements per group: 75445 +16: Maximum number of matrix elements per group: 75445 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 41 +16: Average number of matrix elements per CPU: 10778 +16: Maximum number of matrix elements per CPU: 24390 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 198 -16: Percentage of non-zero blocks: 33.00 -16: Average number of blocks per group: 66 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 46114 -16: Maximum number of matrix elements per group: 50826 -16: Average number of blocks per CPU: 17 -16: Maximum number of blocks per CPU: 33 -16: Average number of matrix elements per CPU: 11529 -16: Maximum number of matrix elements per CPU: 22743 +16: Number of non-zero blocks: 137 +16: Percentage of non-zero blocks: 68.50 +16: Average number of blocks per group: 137 +16: Maximum number of blocks per group: 137 +16: Average number of matrix elements per group: 90231 +16: Maximum number of matrix elements per group: 90231 +16: Average number of blocks per CPU: 20 +16: Maximum number of blocks per CPU: 25 +16: Average number of matrix elements per CPU: 12891 +16: Maximum number of matrix elements per CPU: 17043 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: B^tT X A^tT passed! 16: checksums 0.44E+07 0.44E+07 -16: difference norm 0.14E-13 +16: difference norm 0.18E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: B x A = C 16: -------------------------------------------------------------------------------- 16: mm dims: 10 100 20 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 7094 +16: Est. number of matrix elements per CPU of result matrix: 12160 16: Est. optimal split factor: 1 16: Optimizing distribution of B and A 16: mm case: |T x | = + 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 1 +16: global grid sizes: 1x 7 +16: grid sizes on subgroups: 1x 7 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF C 16: block dimensions: 10 20 16: full dimensions: 270 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: Change process grid: No 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 91 16: Percentage of non-zero blocks: 9.10 -16: Average number of blocks per group: 31 -16: Maximum number of blocks per group: 35 -16: Average number of matrix elements per group: 9626 -16: Maximum number of matrix elements per group: 10560 -16: Average number of blocks per CPU: 8 -16: Maximum number of blocks per CPU: 10 -16: Average number of matrix elements per CPU: 2407 -16: Maximum number of matrix elements per CPU: 4797 +16: Average number of blocks per group: 91 +16: Maximum number of blocks per group: 91 +16: Average number of matrix elements per group: 28878 +16: Maximum number of matrix elements per group: 28878 +16: Average number of blocks per CPU: 13 +16: Maximum number of blocks per CPU: 21 +16: Average number of matrix elements per CPU: 4126 +16: Maximum number of matrix elements per CPU: 15462 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 207 16: Percentage of non-zero blocks: 10.35 -16: Average number of blocks per group: 69 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 21835 -16: Maximum number of matrix elements per group: 25054 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5459 -16: Maximum number of matrix elements per CPU: 7226 +16: Average number of blocks per group: 207 +16: Maximum number of blocks per group: 207 +16: Average number of matrix elements per group: 65504 +16: Maximum number of matrix elements per group: 65504 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 41 +16: Average number of matrix elements per CPU: 9358 +16: Maximum number of matrix elements per CPU: 15279 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 147 -16: Percentage of non-zero blocks: 24.50 -16: Average number of blocks per group: 49 -16: Maximum number of blocks per group: 64 -16: Average number of matrix elements per group: 38358 -16: Maximum number of matrix elements per group: 43740 -16: Average number of blocks per CPU: 13 -16: Maximum number of blocks per CPU: 32 -16: Average number of matrix elements per CPU: 9590 -16: Maximum number of matrix elements per CPU: 19881 +16: Number of non-zero blocks: 113 +16: Percentage of non-zero blocks: 56.50 +16: Average number of blocks per group: 113 +16: Maximum number of blocks per group: 113 +16: Average number of matrix elements per group: 85119 +16: Maximum number of matrix elements per group: 85119 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 25 +16: Average number of matrix elements per CPU: 12160 +16: Maximum number of matrix elements per CPU: 21993 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: BN X AN passed! 16: checksums 0.28E+07 0.28E+07 -16: difference norm 0.89E-14 +16: difference norm 0.00E+00 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: B^t x A = C 16: -------------------------------------------------------------------------------- 16: mm dims: 10 100 20 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 7451 +16: Est. number of matrix elements per CPU of result matrix: 12773 16: Est. optimal split factor: 1 16: Optimizing distribution of B^t and A 16: mm case: |T x | = + 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 1 +16: global grid sizes: 1x 7 +16: grid sizes on subgroups: 1x 7 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF C 16: block dimensions: 10 20 16: full dimensions: 270 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: Change process grid: No 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 114 16: Percentage of non-zero blocks: 11.40 -16: Average number of blocks per group: 38 -16: Maximum number of blocks per group: 41 -16: Average number of matrix elements per group: 11419 -16: Maximum number of matrix elements per group: 12123 -16: Average number of blocks per CPU: 10 -16: Maximum number of blocks per CPU: 16 -16: Average number of matrix elements per CPU: 2855 -16: Maximum number of matrix elements per CPU: 6228 +16: Average number of blocks per group: 114 +16: Maximum number of blocks per group: 114 +16: Average number of matrix elements per group: 34257 +16: Maximum number of matrix elements per group: 34257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 27 +16: Average number of matrix elements per CPU: 4894 +16: Maximum number of matrix elements per CPU: 12750 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 207 16: Percentage of non-zero blocks: 10.35 -16: Average number of blocks per group: 69 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 21835 -16: Maximum number of matrix elements per group: 25054 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5459 -16: Maximum number of matrix elements per CPU: 7226 +16: Average number of blocks per group: 207 +16: Maximum number of blocks per group: 207 +16: Average number of matrix elements per group: 65504 +16: Maximum number of matrix elements per group: 65504 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 41 +16: Average number of matrix elements per CPU: 9358 +16: Maximum number of matrix elements per CPU: 15279 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 183 -16: Percentage of non-zero blocks: 30.50 -16: Average number of blocks per group: 61 -16: Maximum number of blocks per group: 66 -16: Average number of matrix elements per group: 35466 -16: Maximum number of matrix elements per group: 38577 -16: Average number of blocks per CPU: 16 -16: Maximum number of blocks per CPU: 29 -16: Average number of matrix elements per CPU: 8867 -16: Maximum number of matrix elements per CPU: 16137 +16: Number of non-zero blocks: 131 +16: Percentage of non-zero blocks: 65.50 +16: Average number of blocks per group: 131 +16: Maximum number of blocks per group: 131 +16: Average number of matrix elements per group: 89406 +16: Maximum number of matrix elements per group: 89406 +16: Average number of blocks per CPU: 19 +16: Maximum number of blocks per CPU: 25 +16: Average number of matrix elements per CPU: 12773 +16: Maximum number of matrix elements per CPU: 15633 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -56303,320 +56305,320 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 10 100 20 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 7400 +16: Est. number of matrix elements per CPU of result matrix: 12686 16: Est. optimal split factor: 1 16: Optimizing distribution of B and A^t 16: mm case: |T x | = + 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 1 +16: global grid sizes: 1x 7 +16: grid sizes on subgroups: 1x 7 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF C 16: block dimensions: 10 20 16: full dimensions: 270 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: Change process grid: No 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 91 16: Percentage of non-zero blocks: 9.10 -16: Average number of blocks per group: 31 -16: Maximum number of blocks per group: 35 -16: Average number of matrix elements per group: 9626 -16: Maximum number of matrix elements per group: 10560 -16: Average number of blocks per CPU: 8 -16: Maximum number of blocks per CPU: 10 -16: Average number of matrix elements per CPU: 2407 -16: Maximum number of matrix elements per CPU: 4797 +16: Average number of blocks per group: 91 +16: Maximum number of blocks per group: 91 +16: Average number of matrix elements per group: 28878 +16: Maximum number of matrix elements per group: 28878 +16: Average number of blocks per CPU: 13 +16: Maximum number of blocks per CPU: 21 +16: Average number of matrix elements per CPU: 4126 +16: Maximum number of matrix elements per CPU: 15462 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 208 16: Percentage of non-zero blocks: 10.40 -16: Average number of blocks per group: 70 -16: Maximum number of blocks per group: 72 -16: Average number of matrix elements per group: 25149 -16: Maximum number of matrix elements per group: 29364 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 24 -16: Average number of matrix elements per CPU: 6288 -16: Maximum number of matrix elements per CPU: 11811 +16: Average number of blocks per group: 208 +16: Maximum number of blocks per group: 208 +16: Average number of matrix elements per group: 75445 +16: Maximum number of matrix elements per group: 75445 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 41 +16: Average number of matrix elements per CPU: 10778 +16: Maximum number of matrix elements per CPU: 24390 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 170 -16: Percentage of non-zero blocks: 28.33 -16: Average number of blocks per group: 57 -16: Maximum number of blocks per group: 64 -16: Average number of matrix elements per group: 43311 -16: Maximum number of matrix elements per group: 46860 -16: Average number of blocks per CPU: 15 -16: Maximum number of blocks per CPU: 27 -16: Average number of matrix elements per CPU: 10828 -16: Maximum number of matrix elements per CPU: 20892 +16: Number of non-zero blocks: 125 +16: Percentage of non-zero blocks: 62.50 +16: Average number of blocks per group: 125 +16: Maximum number of blocks per group: 125 +16: Average number of matrix elements per group: 88797 +16: Maximum number of matrix elements per group: 88797 +16: Average number of blocks per CPU: 18 +16: Maximum number of blocks per CPU: 28 +16: Average number of matrix elements per CPU: 12686 +16: Maximum number of matrix elements per CPU: 17469 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: BN X A^tT passed! 16: checksums 0.43E+07 0.43E+07 -16: difference norm 0.18E-13 +16: difference norm 0.00E+00 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: B^t x A^t = C 16: -------------------------------------------------------------------------------- 16: mm dims: 10 100 20 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 7520 +16: Est. number of matrix elements per CPU of result matrix: 12891 16: Est. optimal split factor: 1 16: Optimizing distribution of B^t and A^t 16: mm case: |T x | = + 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 1 +16: global grid sizes: 1x 7 +16: grid sizes on subgroups: 1x 7 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: GLOBAL INFO OF C 16: block dimensions: 10 20 16: full dimensions: 270 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 1 7 16: Change process grid: No 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 114 16: Percentage of non-zero blocks: 11.40 -16: Average number of blocks per group: 38 -16: Maximum number of blocks per group: 41 -16: Average number of matrix elements per group: 11419 -16: Maximum number of matrix elements per group: 12123 -16: Average number of blocks per CPU: 10 -16: Maximum number of blocks per CPU: 16 -16: Average number of matrix elements per CPU: 2855 -16: Maximum number of matrix elements per CPU: 6228 +16: Average number of blocks per group: 114 +16: Maximum number of blocks per group: 114 +16: Average number of matrix elements per group: 34257 +16: Maximum number of matrix elements per group: 34257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 27 +16: Average number of matrix elements per CPU: 4894 +16: Maximum number of matrix elements per CPU: 12750 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 208 16: Percentage of non-zero blocks: 10.40 -16: Average number of blocks per group: 70 -16: Maximum number of blocks per group: 72 -16: Average number of matrix elements per group: 25149 -16: Maximum number of matrix elements per group: 29364 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 24 -16: Average number of matrix elements per CPU: 6288 -16: Maximum number of matrix elements per CPU: 11811 +16: Average number of blocks per group: 208 +16: Maximum number of blocks per group: 208 +16: Average number of matrix elements per group: 75445 +16: Maximum number of matrix elements per group: 75445 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 41 +16: Average number of matrix elements per CPU: 10778 +16: Maximum number of matrix elements per CPU: 24390 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 198 -16: Percentage of non-zero blocks: 33.00 -16: Average number of blocks per group: 66 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 46114 -16: Maximum number of matrix elements per group: 50826 -16: Average number of blocks per CPU: 17 -16: Maximum number of blocks per CPU: 33 -16: Average number of matrix elements per CPU: 11529 -16: Maximum number of matrix elements per CPU: 22743 +16: Number of non-zero blocks: 137 +16: Percentage of non-zero blocks: 68.50 +16: Average number of blocks per group: 137 +16: Maximum number of blocks per group: 137 +16: Average number of matrix elements per group: 90231 +16: Maximum number of matrix elements per group: 90231 +16: Average number of blocks per CPU: 20 +16: Maximum number of blocks per CPU: 25 +16: Average number of matrix elements per CPU: 12891 +16: Maximum number of matrix elements per CPU: 17043 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: B^tT X A^tT passed! 16: checksums 0.44E+07 0.44E+07 -16: difference norm 0.14E-13 +16: difference norm 0.18E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: A x C = B^t 16: -------------------------------------------------------------------------------- 16: mm dims: 100 20 10 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 6314 +16: Est. number of matrix elements per CPU of result matrix: 10824 16: Est. optimal split factor: 5 16: Optimizing distribution of A and B^t 16: mm case: | x + = | 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF C 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 207 16: Percentage of non-zero blocks: 10.35 -16: Average number of blocks per group: 69 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 21835 -16: Maximum number of matrix elements per group: 25054 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5459 -16: Maximum number of matrix elements per CPU: 7226 +16: Average number of blocks per group: 30 +16: Maximum number of blocks per group: 39 +16: Average number of matrix elements per group: 9358 +16: Maximum number of matrix elements per group: 14069 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 39 +16: Average number of matrix elements per CPU: 9358 +16: Maximum number of matrix elements per CPU: 14069 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 48 +16: Number of non-zero blocks: 112 16: Percentage of non-zero blocks: 8.00 16: Average number of blocks per group: 16 16: Maximum number of blocks per group: 16 16: Average number of matrix elements per group: 15435 16: Maximum number of matrix elements per group: 15435 -16: Average number of blocks per CPU: 4 -16: Maximum number of blocks per CPU: 6 -16: Average number of matrix elements per CPU: 3859 -16: Maximum number of matrix elements per CPU: 8169 +16: Average number of blocks per CPU: 16 +16: Maximum number of blocks per CPU: 16 +16: Average number of matrix elements per CPU: 15435 +16: Maximum number of matrix elements per CPU: 15435 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 157 16: Percentage of non-zero blocks: 15.70 -16: Average number of blocks per group: 53 -16: Maximum number of blocks per group: 54 -16: Average number of matrix elements per group: 25254 -16: Maximum number of matrix elements per group: 26481 -16: Average number of blocks per CPU: 14 -16: Maximum number of blocks per CPU: 21 -16: Average number of matrix elements per CPU: 6314 -16: Maximum number of matrix elements per CPU: 14928 +16: Average number of blocks per group: 23 +16: Maximum number of blocks per group: 32 +16: Average number of matrix elements per group: 10824 +16: Maximum number of matrix elements per group: 14553 +16: Average number of blocks per CPU: 23 +16: Maximum number of blocks per CPU: 32 +16: Average number of matrix elements per CPU: 10824 +16: Maximum number of matrix elements per CPU: 14553 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: AN X CN passed! 16: checksums 0.81E+07 0.81E+07 -16: difference norm 0.21E-13 +16: difference norm 0.28E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: A^t x C = B^t 16: -------------------------------------------------------------------------------- 16: mm dims: 100 20 10 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 4685 +16: Est. number of matrix elements per CPU of result matrix: 8031 16: Est. optimal split factor: 5 16: Optimizing distribution of A^t and B^t 16: mm case: | x + = | 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF C 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 208 16: Percentage of non-zero blocks: 10.40 -16: Average number of blocks per group: 70 -16: Maximum number of blocks per group: 72 -16: Average number of matrix elements per group: 25149 -16: Maximum number of matrix elements per group: 29364 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 24 -16: Average number of matrix elements per CPU: 6288 -16: Maximum number of matrix elements per CPU: 11811 +16: Average number of blocks per group: 30 +16: Maximum number of blocks per group: 35 +16: Average number of matrix elements per group: 10778 +16: Maximum number of matrix elements per group: 12417 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 35 +16: Average number of matrix elements per CPU: 10778 +16: Maximum number of matrix elements per CPU: 12417 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 48 +16: Number of non-zero blocks: 112 16: Percentage of non-zero blocks: 8.00 16: Average number of blocks per group: 16 16: Maximum number of blocks per group: 16 16: Average number of matrix elements per group: 15435 16: Maximum number of matrix elements per group: 15435 -16: Average number of blocks per CPU: 4 -16: Maximum number of blocks per CPU: 6 -16: Average number of matrix elements per CPU: 3859 -16: Maximum number of matrix elements per CPU: 8169 +16: Average number of blocks per CPU: 16 +16: Maximum number of blocks per CPU: 16 +16: Average number of matrix elements per CPU: 15435 +16: Maximum number of matrix elements per CPU: 15435 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 149 16: Percentage of non-zero blocks: 14.90 -16: Average number of blocks per group: 50 -16: Maximum number of blocks per group: 56 -16: Average number of matrix elements per group: 18738 -16: Maximum number of matrix elements per group: 23340 -16: Average number of blocks per CPU: 13 -16: Maximum number of blocks per CPU: 21 -16: Average number of matrix elements per CPU: 4685 -16: Maximum number of matrix elements per CPU: 10620 +16: Average number of blocks per group: 22 +16: Maximum number of blocks per group: 29 +16: Average number of matrix elements per group: 8031 +16: Maximum number of matrix elements per group: 12486 +16: Average number of blocks per CPU: 22 +16: Maximum number of blocks per CPU: 29 +16: Average number of matrix elements per CPU: 8031 +16: Maximum number of matrix elements per CPU: 12486 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: A^tT X CN passed! 16: checksums 0.60E+07 0.60E+07 -16: difference norm 0.18E-13 +16: difference norm 0.11E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: A x C^t = B^t 16: -------------------------------------------------------------------------------- 16: mm dims: 100 20 10 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 3010 +16: Est. number of matrix elements per CPU of result matrix: 5160 16: Est. optimal split factor: 6 16: Optimizing distribution of A and B^t 16: mm case: | x + = | 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF C^t 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 207 16: Percentage of non-zero blocks: 10.35 -16: Average number of blocks per group: 69 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 21835 -16: Maximum number of matrix elements per group: 25054 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5459 -16: Maximum number of matrix elements per CPU: 7226 +16: Average number of blocks per group: 30 +16: Maximum number of blocks per group: 39 +16: Average number of matrix elements per group: 9358 +16: Maximum number of matrix elements per group: 14069 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 39 +16: Average number of matrix elements per CPU: 9358 +16: Maximum number of matrix elements per CPU: 14069 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 51 +16: Number of non-zero blocks: 119 16: Percentage of non-zero blocks: 8.50 16: Average number of blocks per group: 17 16: Maximum number of blocks per group: 17 16: Average number of matrix elements per group: 11277 16: Maximum number of matrix elements per group: 11277 -16: Average number of blocks per CPU: 5 -16: Maximum number of blocks per CPU: 9 -16: Average number of matrix elements per CPU: 2820 -16: Maximum number of matrix elements per CPU: 7257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 11277 +16: Maximum number of matrix elements per CPU: 11277 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 173 16: Percentage of non-zero blocks: 17.30 -16: Average number of blocks per group: 58 -16: Maximum number of blocks per group: 63 -16: Average number of matrix elements per group: 12038 -16: Maximum number of matrix elements per group: 13194 -16: Average number of blocks per CPU: 15 -16: Maximum number of blocks per CPU: 26 -16: Average number of matrix elements per CPU: 3010 -16: Maximum number of matrix elements per CPU: 5112 +16: Average number of blocks per group: 25 +16: Maximum number of blocks per group: 31 +16: Average number of matrix elements per group: 5160 +16: Maximum number of matrix elements per group: 7131 +16: Average number of blocks per CPU: 25 +16: Maximum number of blocks per CPU: 31 +16: Average number of matrix elements per CPU: 5160 +16: Maximum number of matrix elements per CPU: 7131 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -56628,60 +56630,60 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 100 20 10 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 4145 +16: Est. number of matrix elements per CPU of result matrix: 7106 16: Est. optimal split factor: 7 16: Optimizing distribution of A^t and B^t 16: mm case: | x + = | 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF C^t 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 208 16: Percentage of non-zero blocks: 10.40 -16: Average number of blocks per group: 70 -16: Maximum number of blocks per group: 72 -16: Average number of matrix elements per group: 25149 -16: Maximum number of matrix elements per group: 29364 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 24 -16: Average number of matrix elements per CPU: 6288 -16: Maximum number of matrix elements per CPU: 11811 +16: Average number of blocks per group: 30 +16: Maximum number of blocks per group: 35 +16: Average number of matrix elements per group: 10778 +16: Maximum number of matrix elements per group: 12417 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 35 +16: Average number of matrix elements per CPU: 10778 +16: Maximum number of matrix elements per CPU: 12417 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 51 +16: Number of non-zero blocks: 119 16: Percentage of non-zero blocks: 8.50 16: Average number of blocks per group: 17 16: Maximum number of blocks per group: 17 16: Average number of matrix elements per group: 11277 16: Maximum number of matrix elements per group: 11277 -16: Average number of blocks per CPU: 5 -16: Maximum number of blocks per CPU: 9 -16: Average number of matrix elements per CPU: 2820 -16: Maximum number of matrix elements per CPU: 7257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 11277 +16: Maximum number of matrix elements per CPU: 11277 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 179 16: Percentage of non-zero blocks: 17.90 -16: Average number of blocks per group: 60 -16: Maximum number of blocks per group: 61 -16: Average number of matrix elements per group: 16580 -16: Maximum number of matrix elements per group: 18399 -16: Average number of blocks per CPU: 15 -16: Maximum number of blocks per CPU: 28 -16: Average number of matrix elements per CPU: 4145 -16: Maximum number of matrix elements per CPU: 7044 +16: Average number of blocks per group: 26 +16: Maximum number of blocks per group: 30 +16: Average number of matrix elements per group: 7106 +16: Maximum number of matrix elements per group: 9597 +16: Average number of blocks per CPU: 26 +16: Maximum number of blocks per CPU: 30 +16: Average number of matrix elements per CPU: 7106 +16: Maximum number of matrix elements per CPU: 9597 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -56693,60 +56695,60 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 100 20 10 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 6314 +16: Est. number of matrix elements per CPU of result matrix: 10824 16: Est. optimal split factor: 5 16: Optimizing distribution of A and B 16: mm case: | x + = | 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF C 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 207 16: Percentage of non-zero blocks: 10.35 -16: Average number of blocks per group: 69 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 21835 -16: Maximum number of matrix elements per group: 25054 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5459 -16: Maximum number of matrix elements per CPU: 7226 +16: Average number of blocks per group: 30 +16: Maximum number of blocks per group: 39 +16: Average number of matrix elements per group: 9358 +16: Maximum number of matrix elements per group: 14069 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 39 +16: Average number of matrix elements per CPU: 9358 +16: Maximum number of matrix elements per CPU: 14069 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 48 +16: Number of non-zero blocks: 112 16: Percentage of non-zero blocks: 8.00 16: Average number of blocks per group: 16 16: Maximum number of blocks per group: 16 16: Average number of matrix elements per group: 15435 16: Maximum number of matrix elements per group: 15435 -16: Average number of blocks per CPU: 4 -16: Maximum number of blocks per CPU: 6 -16: Average number of matrix elements per CPU: 3859 -16: Maximum number of matrix elements per CPU: 8169 +16: Average number of blocks per CPU: 16 +16: Maximum number of blocks per CPU: 16 +16: Average number of matrix elements per CPU: 15435 +16: Maximum number of matrix elements per CPU: 15435 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 157 16: Percentage of non-zero blocks: 15.70 -16: Average number of blocks per group: 53 -16: Maximum number of blocks per group: 54 -16: Average number of matrix elements per group: 25254 -16: Maximum number of matrix elements per group: 26481 -16: Average number of blocks per CPU: 14 -16: Maximum number of blocks per CPU: 21 -16: Average number of matrix elements per CPU: 6314 -16: Maximum number of matrix elements per CPU: 14928 +16: Average number of blocks per group: 23 +16: Maximum number of blocks per group: 32 +16: Average number of matrix elements per group: 10824 +16: Maximum number of matrix elements per group: 14553 +16: Average number of blocks per CPU: 23 +16: Maximum number of blocks per CPU: 32 +16: Average number of matrix elements per CPU: 10824 +16: Maximum number of matrix elements per CPU: 14553 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -56758,450 +56760,450 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 100 20 10 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 4685 +16: Est. number of matrix elements per CPU of result matrix: 8031 16: Est. optimal split factor: 5 16: Optimizing distribution of A^t and B 16: mm case: | x + = | 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF C 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 208 16: Percentage of non-zero blocks: 10.40 -16: Average number of blocks per group: 70 -16: Maximum number of blocks per group: 72 -16: Average number of matrix elements per group: 25149 -16: Maximum number of matrix elements per group: 29364 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 24 -16: Average number of matrix elements per CPU: 6288 -16: Maximum number of matrix elements per CPU: 11811 +16: Average number of blocks per group: 30 +16: Maximum number of blocks per group: 35 +16: Average number of matrix elements per group: 10778 +16: Maximum number of matrix elements per group: 12417 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 35 +16: Average number of matrix elements per CPU: 10778 +16: Maximum number of matrix elements per CPU: 12417 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 48 +16: Number of non-zero blocks: 112 16: Percentage of non-zero blocks: 8.00 16: Average number of blocks per group: 16 16: Maximum number of blocks per group: 16 16: Average number of matrix elements per group: 15435 16: Maximum number of matrix elements per group: 15435 -16: Average number of blocks per CPU: 4 -16: Maximum number of blocks per CPU: 6 -16: Average number of matrix elements per CPU: 3859 -16: Maximum number of matrix elements per CPU: 8169 +16: Average number of blocks per CPU: 16 +16: Maximum number of blocks per CPU: 16 +16: Average number of matrix elements per CPU: 15435 +16: Maximum number of matrix elements per CPU: 15435 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 149 16: Percentage of non-zero blocks: 14.90 -16: Average number of blocks per group: 50 -16: Maximum number of blocks per group: 56 -16: Average number of matrix elements per group: 18738 -16: Maximum number of matrix elements per group: 23340 -16: Average number of blocks per CPU: 13 -16: Maximum number of blocks per CPU: 21 -16: Average number of matrix elements per CPU: 4685 -16: Maximum number of matrix elements per CPU: 10620 +16: Average number of blocks per group: 22 +16: Maximum number of blocks per group: 29 +16: Average number of matrix elements per group: 8031 +16: Maximum number of matrix elements per group: 12486 +16: Average number of blocks per CPU: 22 +16: Maximum number of blocks per CPU: 29 +16: Average number of matrix elements per CPU: 8031 +16: Maximum number of matrix elements per CPU: 12486 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: A^tT X CN passed! 16: checksums 0.60E+07 0.60E+07 -16: difference norm 0.25E-13 +16: difference norm 0.11E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: A x C^t = B 16: -------------------------------------------------------------------------------- 16: mm dims: 100 20 10 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 3010 +16: Est. number of matrix elements per CPU of result matrix: 5160 16: Est. optimal split factor: 6 16: Optimizing distribution of A and B 16: mm case: | x + = | 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF C^t 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 207 16: Percentage of non-zero blocks: 10.35 -16: Average number of blocks per group: 69 -16: Maximum number of blocks per group: 69 -16: Average number of matrix elements per group: 21835 -16: Maximum number of matrix elements per group: 25054 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5459 -16: Maximum number of matrix elements per CPU: 7226 +16: Average number of blocks per group: 30 +16: Maximum number of blocks per group: 39 +16: Average number of matrix elements per group: 9358 +16: Maximum number of matrix elements per group: 14069 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 39 +16: Average number of matrix elements per CPU: 9358 +16: Maximum number of matrix elements per CPU: 14069 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 51 +16: Number of non-zero blocks: 119 16: Percentage of non-zero blocks: 8.50 16: Average number of blocks per group: 17 16: Maximum number of blocks per group: 17 16: Average number of matrix elements per group: 11277 16: Maximum number of matrix elements per group: 11277 -16: Average number of blocks per CPU: 5 -16: Maximum number of blocks per CPU: 9 -16: Average number of matrix elements per CPU: 2820 -16: Maximum number of matrix elements per CPU: 7257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 11277 +16: Maximum number of matrix elements per CPU: 11277 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 173 16: Percentage of non-zero blocks: 17.30 -16: Average number of blocks per group: 58 -16: Maximum number of blocks per group: 63 -16: Average number of matrix elements per group: 12038 -16: Maximum number of matrix elements per group: 13194 -16: Average number of blocks per CPU: 15 -16: Maximum number of blocks per CPU: 26 -16: Average number of matrix elements per CPU: 3010 -16: Maximum number of matrix elements per CPU: 5112 +16: Average number of blocks per group: 25 +16: Maximum number of blocks per group: 31 +16: Average number of matrix elements per group: 5160 +16: Maximum number of matrix elements per group: 7131 +16: Average number of blocks per CPU: 25 +16: Maximum number of blocks per CPU: 31 +16: Average number of matrix elements per CPU: 5160 +16: Maximum number of matrix elements per CPU: 7131 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: AN X C^tT passed! 16: checksums 0.26E+07 0.26E+07 -16: difference norm 0.21E-13 +16: difference norm 0.36E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: A^t x C^t = B 16: -------------------------------------------------------------------------------- 16: mm dims: 100 20 10 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 4145 +16: Est. number of matrix elements per CPU of result matrix: 7106 16: Est. optimal split factor: 7 16: Optimizing distribution of A^t and B 16: mm case: | x + = | 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF C^t 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 208 16: Percentage of non-zero blocks: 10.40 -16: Average number of blocks per group: 70 -16: Maximum number of blocks per group: 72 -16: Average number of matrix elements per group: 25149 -16: Maximum number of matrix elements per group: 29364 -16: Average number of blocks per CPU: 18 -16: Maximum number of blocks per CPU: 24 -16: Average number of matrix elements per CPU: 6288 -16: Maximum number of matrix elements per CPU: 11811 +16: Average number of blocks per group: 30 +16: Maximum number of blocks per group: 35 +16: Average number of matrix elements per group: 10778 +16: Maximum number of matrix elements per group: 12417 +16: Average number of blocks per CPU: 30 +16: Maximum number of blocks per CPU: 35 +16: Average number of matrix elements per CPU: 10778 +16: Maximum number of matrix elements per CPU: 12417 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 51 +16: Number of non-zero blocks: 119 16: Percentage of non-zero blocks: 8.50 16: Average number of blocks per group: 17 16: Maximum number of blocks per group: 17 16: Average number of matrix elements per group: 11277 16: Maximum number of matrix elements per group: 11277 -16: Average number of blocks per CPU: 5 -16: Maximum number of blocks per CPU: 9 -16: Average number of matrix elements per CPU: 2820 -16: Maximum number of matrix elements per CPU: 7257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 11277 +16: Maximum number of matrix elements per CPU: 11277 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 179 16: Percentage of non-zero blocks: 17.90 -16: Average number of blocks per group: 60 -16: Maximum number of blocks per group: 61 -16: Average number of matrix elements per group: 16580 -16: Maximum number of matrix elements per group: 18399 -16: Average number of blocks per CPU: 15 -16: Maximum number of blocks per CPU: 28 -16: Average number of matrix elements per CPU: 4145 -16: Maximum number of matrix elements per CPU: 7044 +16: Average number of blocks per group: 26 +16: Maximum number of blocks per group: 30 +16: Average number of matrix elements per group: 7106 +16: Maximum number of matrix elements per group: 9597 +16: Average number of blocks per CPU: 26 +16: Maximum number of blocks per CPU: 30 +16: Average number of matrix elements per CPU: 7106 +16: Maximum number of matrix elements per CPU: 9597 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: A^tT X C^tT passed! 16: checksums 0.61E+07 0.61E+07 -16: difference norm 0.32E-13 +16: difference norm 0.36E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: C x B = A^t 16: -------------------------------------------------------------------------------- 16: mm dims: 20 10 100 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 3934 +16: Est. number of matrix elements per CPU of result matrix: 6744 16: Est. optimal split factor: 3 16: Optimizing distribution of B and A^t 16: mm case: + x |T = |T 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF C 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 48 +16: Number of non-zero blocks: 112 16: Percentage of non-zero blocks: 8.00 16: Average number of blocks per group: 16 16: Maximum number of blocks per group: 16 16: Average number of matrix elements per group: 15435 16: Maximum number of matrix elements per group: 15435 -16: Average number of blocks per CPU: 4 -16: Maximum number of blocks per CPU: 6 -16: Average number of matrix elements per CPU: 3859 -16: Maximum number of matrix elements per CPU: 8169 +16: Average number of blocks per CPU: 16 +16: Maximum number of blocks per CPU: 16 +16: Average number of matrix elements per CPU: 15435 +16: Maximum number of matrix elements per CPU: 15435 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 91 16: Percentage of non-zero blocks: 9.10 -16: Average number of blocks per group: 31 -16: Maximum number of blocks per group: 35 -16: Average number of matrix elements per group: 9626 -16: Maximum number of matrix elements per group: 10560 -16: Average number of blocks per CPU: 8 -16: Maximum number of blocks per CPU: 10 -16: Average number of matrix elements per CPU: 2407 -16: Maximum number of matrix elements per CPU: 4797 +16: Average number of blocks per group: 13 +16: Maximum number of blocks per group: 17 +16: Average number of matrix elements per group: 4126 +16: Maximum number of matrix elements per group: 5730 +16: Average number of blocks per CPU: 13 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 4126 +16: Maximum number of matrix elements per CPU: 5730 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 152 16: Percentage of non-zero blocks: 7.60 -16: Average number of blocks per group: 51 -16: Maximum number of blocks per group: 65 -16: Average number of matrix elements per group: 15736 -16: Maximum number of matrix elements per group: 19557 -16: Average number of blocks per CPU: 13 -16: Maximum number of blocks per CPU: 23 -16: Average number of matrix elements per CPU: 3934 -16: Maximum number of matrix elements per CPU: 7499 +16: Average number of blocks per group: 22 +16: Maximum number of blocks per group: 31 +16: Average number of matrix elements per group: 6744 +16: Maximum number of matrix elements per group: 11788 +16: Average number of blocks per CPU: 22 +16: Maximum number of blocks per CPU: 31 +16: Average number of matrix elements per CPU: 6744 +16: Maximum number of matrix elements per CPU: 11788 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: CN X BN passed! 16: checksums 0.83E+07 0.83E+07 -16: difference norm 0.00E+00 +16: difference norm 0.18E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: C^t x B = A^t 16: -------------------------------------------------------------------------------- 16: mm dims: 20 10 100 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 4185 +16: Est. number of matrix elements per CPU of result matrix: 7173 16: Est. optimal split factor: 4 16: Optimizing distribution of B and A^t 16: mm case: + x |T = |T 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF C^t 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 51 +16: Number of non-zero blocks: 119 16: Percentage of non-zero blocks: 8.50 16: Average number of blocks per group: 17 16: Maximum number of blocks per group: 17 16: Average number of matrix elements per group: 11277 16: Maximum number of matrix elements per group: 11277 -16: Average number of blocks per CPU: 5 -16: Maximum number of blocks per CPU: 9 -16: Average number of matrix elements per CPU: 2820 -16: Maximum number of matrix elements per CPU: 7257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 11277 +16: Maximum number of matrix elements per CPU: 11277 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 91 16: Percentage of non-zero blocks: 9.10 -16: Average number of blocks per group: 31 -16: Maximum number of blocks per group: 35 -16: Average number of matrix elements per group: 9626 -16: Maximum number of matrix elements per group: 10560 -16: Average number of blocks per CPU: 8 -16: Maximum number of blocks per CPU: 10 -16: Average number of matrix elements per CPU: 2407 -16: Maximum number of matrix elements per CPU: 4797 +16: Average number of blocks per group: 13 +16: Maximum number of blocks per group: 17 +16: Average number of matrix elements per group: 4126 +16: Maximum number of matrix elements per group: 5730 +16: Average number of blocks per CPU: 13 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 4126 +16: Maximum number of matrix elements per CPU: 5730 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 135 16: Percentage of non-zero blocks: 6.75 -16: Average number of blocks per group: 45 -16: Maximum number of blocks per group: 49 -16: Average number of matrix elements per group: 16737 -16: Maximum number of matrix elements per group: 19052 -16: Average number of blocks per CPU: 12 -16: Maximum number of blocks per CPU: 17 -16: Average number of matrix elements per CPU: 4185 -16: Maximum number of matrix elements per CPU: 10264 +16: Average number of blocks per group: 20 +16: Maximum number of blocks per group: 26 +16: Average number of matrix elements per group: 7173 +16: Maximum number of matrix elements per group: 10488 +16: Average number of blocks per CPU: 20 +16: Maximum number of blocks per CPU: 26 +16: Average number of matrix elements per CPU: 7173 +16: Maximum number of matrix elements per CPU: 10488 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: C^tT X BN passed! 16: checksums 0.24E+07 0.24E+07 -16: difference norm 0.89E-14 +16: difference norm 0.36E-14 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: C x B^t = A^t 16: -------------------------------------------------------------------------------- 16: mm dims: 20 10 100 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 5273 +16: Est. number of matrix elements per CPU of result matrix: 9039 16: Est. optimal split factor: 4 16: Optimizing distribution of B^t and A^t 16: mm case: + x |T = |T 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF C 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 48 +16: Number of non-zero blocks: 112 16: Percentage of non-zero blocks: 8.00 16: Average number of blocks per group: 16 16: Maximum number of blocks per group: 16 16: Average number of matrix elements per group: 15435 16: Maximum number of matrix elements per group: 15435 -16: Average number of blocks per CPU: 4 -16: Maximum number of blocks per CPU: 6 -16: Average number of matrix elements per CPU: 3859 -16: Maximum number of matrix elements per CPU: 8169 +16: Average number of blocks per CPU: 16 +16: Maximum number of blocks per CPU: 16 +16: Average number of matrix elements per CPU: 15435 +16: Maximum number of matrix elements per CPU: 15435 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 114 16: Percentage of non-zero blocks: 11.40 -16: Average number of blocks per group: 38 -16: Maximum number of blocks per group: 41 -16: Average number of matrix elements per group: 11419 -16: Maximum number of matrix elements per group: 12123 -16: Average number of blocks per CPU: 10 -16: Maximum number of blocks per CPU: 16 -16: Average number of matrix elements per CPU: 2855 -16: Maximum number of matrix elements per CPU: 6228 +16: Average number of blocks per group: 17 +16: Maximum number of blocks per group: 20 +16: Average number of matrix elements per group: 4894 +16: Maximum number of matrix elements per group: 6792 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 20 +16: Average number of matrix elements per CPU: 4894 +16: Maximum number of matrix elements per CPU: 6792 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 169 16: Percentage of non-zero blocks: 8.45 -16: Average number of blocks per group: 57 -16: Maximum number of blocks per group: 63 -16: Average number of matrix elements per group: 21091 -16: Maximum number of matrix elements per group: 25748 -16: Average number of blocks per CPU: 15 -16: Maximum number of blocks per CPU: 25 -16: Average number of matrix elements per CPU: 5273 -16: Maximum number of matrix elements per CPU: 8804 +16: Average number of blocks per group: 25 +16: Maximum number of blocks per group: 37 +16: Average number of matrix elements per group: 9039 +16: Maximum number of matrix elements per group: 17258 +16: Average number of blocks per CPU: 25 +16: Maximum number of blocks per CPU: 37 +16: Average number of matrix elements per CPU: 9039 +16: Maximum number of matrix elements per CPU: 17258 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: CN X B^tT passed! 16: checksums 0.56E+07 0.56E+07 -16: difference norm 0.53E-14 +16: difference norm 0.00E+00 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: C^t x B^t = A^t 16: -------------------------------------------------------------------------------- 16: mm dims: 20 10 100 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 5619 +16: Est. number of matrix elements per CPU of result matrix: 9633 16: Est. optimal split factor: 6 16: Optimizing distribution of B^t and A^t 16: mm case: + x |T = |T 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF C^t 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF A^t 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 51 +16: Number of non-zero blocks: 119 16: Percentage of non-zero blocks: 8.50 16: Average number of blocks per group: 17 16: Maximum number of blocks per group: 17 16: Average number of matrix elements per group: 11277 16: Maximum number of matrix elements per group: 11277 -16: Average number of blocks per CPU: 5 -16: Maximum number of blocks per CPU: 9 -16: Average number of matrix elements per CPU: 2820 -16: Maximum number of matrix elements per CPU: 7257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 11277 +16: Maximum number of matrix elements per CPU: 11277 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 114 16: Percentage of non-zero blocks: 11.40 -16: Average number of blocks per group: 38 -16: Maximum number of blocks per group: 41 -16: Average number of matrix elements per group: 11419 -16: Maximum number of matrix elements per group: 12123 -16: Average number of blocks per CPU: 10 -16: Maximum number of blocks per CPU: 16 -16: Average number of matrix elements per CPU: 2855 -16: Maximum number of matrix elements per CPU: 6228 +16: Average number of blocks per group: 17 +16: Maximum number of blocks per group: 20 +16: Average number of matrix elements per group: 4894 +16: Maximum number of matrix elements per group: 6792 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 20 +16: Average number of matrix elements per CPU: 4894 +16: Maximum number of matrix elements per CPU: 6792 16: DISTRIBUTION OF A^t 16: Number of non-zero blocks: 164 16: Percentage of non-zero blocks: 8.20 -16: Average number of blocks per group: 55 -16: Maximum number of blocks per group: 55 -16: Average number of matrix elements per group: 22476 -16: Maximum number of matrix elements per group: 23896 -16: Average number of blocks per CPU: 14 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5619 -16: Maximum number of matrix elements per CPU: 11321 +16: Average number of blocks per group: 24 +16: Maximum number of blocks per group: 30 +16: Average number of matrix elements per group: 9633 +16: Maximum number of matrix elements per group: 12420 +16: Average number of blocks per CPU: 24 +16: Maximum number of blocks per CPU: 30 +16: Average number of matrix elements per CPU: 9633 +16: Maximum number of matrix elements per CPU: 12420 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -57213,60 +57215,60 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 20 10 100 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 3934 +16: Est. number of matrix elements per CPU of result matrix: 6744 16: Est. optimal split factor: 3 16: Optimizing distribution of B and A 16: mm case: + x |T = |T 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF C 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 48 +16: Number of non-zero blocks: 112 16: Percentage of non-zero blocks: 8.00 16: Average number of blocks per group: 16 16: Maximum number of blocks per group: 16 16: Average number of matrix elements per group: 15435 16: Maximum number of matrix elements per group: 15435 -16: Average number of blocks per CPU: 4 -16: Maximum number of blocks per CPU: 6 -16: Average number of matrix elements per CPU: 3859 -16: Maximum number of matrix elements per CPU: 8169 +16: Average number of blocks per CPU: 16 +16: Maximum number of blocks per CPU: 16 +16: Average number of matrix elements per CPU: 15435 +16: Maximum number of matrix elements per CPU: 15435 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 91 16: Percentage of non-zero blocks: 9.10 -16: Average number of blocks per group: 31 -16: Maximum number of blocks per group: 35 -16: Average number of matrix elements per group: 9626 -16: Maximum number of matrix elements per group: 10560 -16: Average number of blocks per CPU: 8 -16: Maximum number of blocks per CPU: 10 -16: Average number of matrix elements per CPU: 2407 -16: Maximum number of matrix elements per CPU: 4797 +16: Average number of blocks per group: 13 +16: Maximum number of blocks per group: 17 +16: Average number of matrix elements per group: 4126 +16: Maximum number of matrix elements per group: 5730 +16: Average number of blocks per CPU: 13 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 4126 +16: Maximum number of matrix elements per CPU: 5730 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 152 16: Percentage of non-zero blocks: 7.60 -16: Average number of blocks per group: 51 -16: Maximum number of blocks per group: 65 -16: Average number of matrix elements per group: 15736 -16: Maximum number of matrix elements per group: 19557 -16: Average number of blocks per CPU: 13 -16: Maximum number of blocks per CPU: 23 -16: Average number of matrix elements per CPU: 3934 -16: Maximum number of matrix elements per CPU: 7499 +16: Average number of blocks per group: 22 +16: Maximum number of blocks per group: 31 +16: Average number of matrix elements per group: 6744 +16: Maximum number of matrix elements per group: 11788 +16: Average number of blocks per CPU: 22 +16: Maximum number of blocks per CPU: 31 +16: Average number of matrix elements per CPU: 6744 +16: Maximum number of matrix elements per CPU: 11788 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -57278,60 +57280,60 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 20 10 100 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 4185 +16: Est. number of matrix elements per CPU of result matrix: 7173 16: Est. optimal split factor: 4 16: Optimizing distribution of B and A 16: mm case: + x |T = |T 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF C^t 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 51 +16: Number of non-zero blocks: 119 16: Percentage of non-zero blocks: 8.50 16: Average number of blocks per group: 17 16: Maximum number of blocks per group: 17 16: Average number of matrix elements per group: 11277 16: Maximum number of matrix elements per group: 11277 -16: Average number of blocks per CPU: 5 -16: Maximum number of blocks per CPU: 9 -16: Average number of matrix elements per CPU: 2820 -16: Maximum number of matrix elements per CPU: 7257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 11277 +16: Maximum number of matrix elements per CPU: 11277 16: DISTRIBUTION OF B 16: Number of non-zero blocks: 91 16: Percentage of non-zero blocks: 9.10 -16: Average number of blocks per group: 31 -16: Maximum number of blocks per group: 35 -16: Average number of matrix elements per group: 9626 -16: Maximum number of matrix elements per group: 10560 -16: Average number of blocks per CPU: 8 -16: Maximum number of blocks per CPU: 10 -16: Average number of matrix elements per CPU: 2407 -16: Maximum number of matrix elements per CPU: 4797 +16: Average number of blocks per group: 13 +16: Maximum number of blocks per group: 17 +16: Average number of matrix elements per group: 4126 +16: Maximum number of matrix elements per group: 5730 +16: Average number of blocks per CPU: 13 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 4126 +16: Maximum number of matrix elements per CPU: 5730 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 135 16: Percentage of non-zero blocks: 6.75 -16: Average number of blocks per group: 45 -16: Maximum number of blocks per group: 49 -16: Average number of matrix elements per group: 16737 -16: Maximum number of matrix elements per group: 19052 -16: Average number of blocks per CPU: 12 -16: Maximum number of blocks per CPU: 17 -16: Average number of matrix elements per CPU: 4185 -16: Maximum number of matrix elements per CPU: 10264 +16: Average number of blocks per group: 20 +16: Maximum number of blocks per group: 26 +16: Average number of matrix elements per group: 7173 +16: Maximum number of matrix elements per group: 10488 +16: Average number of blocks per CPU: 20 +16: Maximum number of blocks per CPU: 26 +16: Average number of matrix elements per CPU: 7173 +16: Maximum number of matrix elements per CPU: 10488 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- @@ -57343,131 +57345,131 @@ 16: -------------------------------------------------------------------------------- 16: mm dims: 20 10 100 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 5273 +16: Est. number of matrix elements per CPU of result matrix: 9039 16: Est. optimal split factor: 4 16: Optimizing distribution of B^t and A 16: mm case: + x |T = |T 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF C 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF C replicated -16: Number of non-zero blocks: 48 +16: Number of non-zero blocks: 112 16: Percentage of non-zero blocks: 8.00 16: Average number of blocks per group: 16 16: Maximum number of blocks per group: 16 16: Average number of matrix elements per group: 15435 16: Maximum number of matrix elements per group: 15435 -16: Average number of blocks per CPU: 4 -16: Maximum number of blocks per CPU: 6 -16: Average number of matrix elements per CPU: 3859 -16: Maximum number of matrix elements per CPU: 8169 +16: Average number of blocks per CPU: 16 +16: Maximum number of blocks per CPU: 16 +16: Average number of matrix elements per CPU: 15435 +16: Maximum number of matrix elements per CPU: 15435 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 114 16: Percentage of non-zero blocks: 11.40 -16: Average number of blocks per group: 38 -16: Maximum number of blocks per group: 41 -16: Average number of matrix elements per group: 11419 -16: Maximum number of matrix elements per group: 12123 -16: Average number of blocks per CPU: 10 -16: Maximum number of blocks per CPU: 16 -16: Average number of matrix elements per CPU: 2855 -16: Maximum number of matrix elements per CPU: 6228 +16: Average number of blocks per group: 17 +16: Maximum number of blocks per group: 20 +16: Average number of matrix elements per group: 4894 +16: Maximum number of matrix elements per group: 6792 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 20 +16: Average number of matrix elements per CPU: 4894 +16: Maximum number of matrix elements per CPU: 6792 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 169 16: Percentage of non-zero blocks: 8.45 -16: Average number of blocks per group: 57 -16: Maximum number of blocks per group: 63 -16: Average number of matrix elements per group: 21091 -16: Maximum number of matrix elements per group: 25748 -16: Average number of blocks per CPU: 15 -16: Maximum number of blocks per CPU: 25 -16: Average number of matrix elements per CPU: 5273 -16: Maximum number of matrix elements per CPU: 8804 +16: Average number of blocks per group: 25 +16: Maximum number of blocks per group: 37 +16: Average number of matrix elements per group: 9039 +16: Maximum number of matrix elements per group: 17258 +16: Average number of blocks per CPU: 25 +16: Maximum number of blocks per CPU: 37 +16: Average number of matrix elements per CPU: 9039 +16: Maximum number of matrix elements per CPU: 17258 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: CN X B^tT passed! 16: checksums 0.56E+07 0.56E+07 -16: difference norm 0.00E+00 +16: difference norm 0.21E-13 16: -------------------------------------------------------------------------------- 16: DBCSR TAS MATRIX MULTIPLICATION: C^t x B^t = A 16: -------------------------------------------------------------------------------- 16: mm dims: 20 10 100 16: MM PARAMETERS -16: Est. number of matrix elements per CPU of result matrix: 5619 +16: Est. number of matrix elements per CPU of result matrix: 9633 16: Est. optimal split factor: 6 16: Optimizing distribution of B^t and A 16: mm case: + x |T = |T 16: SPLIT / PARALLELIZATION INFO -16: splitting rows by factor 3 -16: global grid sizes: 6x 2 -16: grid sizes on subgroups: 2x 2 +16: splitting rows by factor 7 +16: global grid sizes: 7x 1 +16: grid sizes on subgroups: 1x 1 16: GLOBAL INFO OF C^t 16: block dimensions: 20 10 16: full dimensions: 559 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF B^t 16: block dimensions: 100 10 16: full dimensions: 1260 270 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: GLOBAL INFO OF A 16: block dimensions: 100 20 16: full dimensions: 1260 559 -16: process grid dimensions: 6 2 +16: process grid dimensions: 7 1 16: Change process grid: No 16: DISTRIBUTION OF C^t replicated -16: Number of non-zero blocks: 51 +16: Number of non-zero blocks: 119 16: Percentage of non-zero blocks: 8.50 16: Average number of blocks per group: 17 16: Maximum number of blocks per group: 17 16: Average number of matrix elements per group: 11277 16: Maximum number of matrix elements per group: 11277 -16: Average number of blocks per CPU: 5 -16: Maximum number of blocks per CPU: 9 -16: Average number of matrix elements per CPU: 2820 -16: Maximum number of matrix elements per CPU: 7257 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 17 +16: Average number of matrix elements per CPU: 11277 +16: Maximum number of matrix elements per CPU: 11277 16: DISTRIBUTION OF B^t 16: Number of non-zero blocks: 114 16: Percentage of non-zero blocks: 11.40 -16: Average number of blocks per group: 38 -16: Maximum number of blocks per group: 41 -16: Average number of matrix elements per group: 11419 -16: Maximum number of matrix elements per group: 12123 -16: Average number of blocks per CPU: 10 -16: Maximum number of blocks per CPU: 16 -16: Average number of matrix elements per CPU: 2855 -16: Maximum number of matrix elements per CPU: 6228 +16: Average number of blocks per group: 17 +16: Maximum number of blocks per group: 20 +16: Average number of matrix elements per group: 4894 +16: Maximum number of matrix elements per group: 6792 +16: Average number of blocks per CPU: 17 +16: Maximum number of blocks per CPU: 20 +16: Average number of matrix elements per CPU: 4894 +16: Maximum number of matrix elements per CPU: 6792 16: DISTRIBUTION OF A 16: Number of non-zero blocks: 164 16: Percentage of non-zero blocks: 8.20 -16: Average number of blocks per group: 55 -16: Maximum number of blocks per group: 55 -16: Average number of matrix elements per group: 22476 -16: Maximum number of matrix elements per group: 23896 -16: Average number of blocks per CPU: 14 -16: Maximum number of blocks per CPU: 22 -16: Average number of matrix elements per CPU: 5619 -16: Maximum number of matrix elements per CPU: 11321 +16: Average number of blocks per group: 24 +16: Maximum number of blocks per group: 30 +16: Average number of matrix elements per group: 9633 +16: Maximum number of matrix elements per group: 12420 +16: Average number of blocks per CPU: 24 +16: Maximum number of blocks per CPU: 30 +16: Average number of matrix elements per CPU: 9633 +16: Maximum number of matrix elements per CPU: 12420 16: -------------------------------------------------------------------------------- 16: TAS MATRIX MULTIPLICATION DONE 16: -------------------------------------------------------------------------------- 16: C^tT X B^tT passed! 16: checksums 0.57E+07 0.57E+07 -16: difference norm 0.53E-14 +16: difference norm 0.36E-14 16: 16: ------------------------------------------------------------------------------- 16: - - @@ -57476,408 +57478,279 @@ 16: ------------------------------------------------------------------------------- 16: COUNTER TOTAL BLAS SMM ACC 16: flops 2 x 3 x 5 420 100.0% 0.0% 0.0% -16: flops 2 x 8 x 3 480 100.0% 0.0% 0.0% -16: flops 2 x 15 x 8 480 100.0% 0.0% 0.0% 16: flops 2 x 5 x 3 540 100.0% 0.0% 0.0% 16: flops 2 x 3 x 8 672 100.0% 0.0% 0.0% 16: flops 2 x 3 x 12 720 100.0% 0.0% 0.0% -16: flops 2 x 8 x 12 768 100.0% 0.0% 0.0% -16: flops 2 x 13 x 3 780 100.0% 0.0% 0.0% -16: flops 2 x 12 x 3 864 100.0% 0.0% 0.0% -16: flops 13 x 2 x 3 936 100.0% 0.0% 0.0% -16: flops 5 x 2 x 3 1020 100.0% 0.0% 0.0% +16: flops 3 x 2 x 5 840 100.0% 0.0% 0.0% 16: flops 2 x 33 x 8 1056 100.0% 0.0% 0.0% 16: flops 9 x 5 x 3 1080 100.0% 0.0% 0.0% -16: flops 2 x 13 x 12 1248 100.0% 0.0% 0.0% -16: flops 3 x 2 x 5 1260 100.0% 0.0% 0.0% -16: flops 3 x 2 x 8 1440 100.0% 0.0% 0.0% -16: flops 15 x 2 x 8 1440 100.0% 0.0% 0.0% +16: flops 2 x 12 x 3 1152 100.0% 0.0% 0.0% +16: flops 2 x 8 x 3 1152 100.0% 0.0% 0.0% +16: flops 3 x 2 x 8 1344 100.0% 0.0% 0.0% +16: flops 3 x 2 x 12 1440 100.0% 0.0% 0.0% 16: flops 2 x 5 x 12 1440 100.0% 0.0% 0.0% -16: flops 2 x 15 x 5 1500 100.0% 0.0% 0.0% -16: flops 15 x 2 x 13 1560 100.0% 0.0% 0.0% -16: flops 3 x 2 x 12 1584 100.0% 0.0% 0.0% 16: flops 2 x 12 x 5 1680 100.0% 0.0% 0.0% -16: flops 12 x 2 x 3 1728 100.0% 0.0% 0.0% -16: flops 9 x 8 x 3 1728 100.0% 0.0% 0.0% -16: flops 8 x 2 x 3 1920 100.0% 0.0% 0.0% -16: flops 9 x 13 x 3 2106 100.0% 0.0% 0.0% -16: flops 2 x 25 x 3 2400 100.0% 0.0% 0.0% -16: flops 25 x 2 x 3 2400 100.0% 0.0% 0.0% -16: flops 25 x 2 x 12 2400 100.0% 0.0% 0.0% -16: flops 12 x 2 x 13 2496 100.0% 0.0% 0.0% -16: flops 13 x 2 x 12 2496 100.0% 0.0% 0.0% -16: flops 9 x 12 x 3 2592 100.0% 0.0% 0.0% +16: flops 2 x 8 x 12 1920 100.0% 0.0% 0.0% +16: flops 33 x 2 x 8 2112 100.0% 0.0% 0.0% 16: flops 2 x 12 x 8 2688 100.0% 0.0% 0.0% -16: flops 25 x 3 x 9 2700 100.0% 0.0% 0.0% -16: flops 3 x 13 x 9 2808 100.0% 0.0% 0.0% -16: flops 2 x 15 x 12 2880 100.0% 0.0% 0.0% -16: flops 3 x 5 x 9 2970 100.0% 0.0% 0.0% +16: flops 5 x 9 x 3 2700 100.0% 0.0% 0.0% 16: flops 9 x 3 x 5 2970 100.0% 0.0% 0.0% -16: flops 3 x 2 x 25 3000 100.0% 0.0% 0.0% -16: flops 3 x 8 x 9 3024 100.0% 0.0% 0.0% -16: flops 33 x 2 x 8 3168 100.0% 0.0% 0.0% -16: flops 5 x 9 x 3 3240 100.0% 0.0% 0.0% -16: flops 33 x 2 x 13 3432 100.0% 0.0% 0.0% +16: flops 3 x 5 x 9 2970 100.0% 0.0% 0.0% +16: flops 9 x 8 x 3 3024 100.0% 0.0% 0.0% +16: flops 9 x 12 x 3 3240 100.0% 0.0% 0.0% +16: flops 12 x 2 x 5 3360 100.0% 0.0% 0.0% 16: flops 15 x 5 x 23 3450 100.0% 0.0% 0.0% -16: flops 2 x 12 x 12 3456 100.0% 0.0% 0.0% -16: flops 3 x 23 x 13 3588 100.0% 0.0% 0.0% -16: flops 13 x 9 x 3 4212 100.0% 0.0% 0.0% -16: flops 5 x 2 x 12 4320 100.0% 0.0% 0.0% -16: flops 15 x 2 x 12 4320 100.0% 0.0% 0.0% -16: flops 23 x 8 x 12 4416 100.0% 0.0% 0.0% -16: flops 15 x 2 x 5 4500 100.0% 0.0% 0.0% -16: flops 3 x 12 x 9 4536 100.0% 0.0% 0.0% -16: flops 9 x 8 x 33 4752 100.0% 0.0% 0.0% -16: flops 2 x 25 x 12 4800 100.0% 0.0% 0.0% -16: flops 2 x 78 x 8 4992 100.0% 0.0% 0.0% -16: flops 8 x 2 x 12 4992 100.0% 0.0% 0.0% -16: flops 12 x 2 x 5 5040 100.0% 0.0% 0.0% -16: flops 12 x 9 x 3 5184 100.0% 0.0% 0.0% -16: flops 3 x 13 x 23 5382 100.0% 0.0% 0.0% +16: flops 12 x 2 x 12 3456 100.0% 0.0% 0.0% +16: flops 2 x 12 x 12 4032 100.0% 0.0% 0.0% +16: flops 3 x 8 x 9 4752 100.0% 0.0% 0.0% +16: flops 12 x 2 x 8 5376 100.0% 0.0% 0.0% 16: flops 23 x 3 x 5 5520 100.0% 0.0% 0.0% 16: flops 12 x 5 x 23 5520 100.0% 0.0% 0.0% -16: flops 15 x 2 x 25 6000 100.0% 0.0% 0.0% 16: flops 8 x 9 x 3 6048 100.0% 0.0% 0.0% -16: flops 12 x 2 x 8 6528 100.0% 0.0% 0.0% 16: flops 2 x 33 x 5 6600 100.0% 0.0% 0.0% -16: flops 33 x 2 x 25 6600 100.0% 0.0% 0.0% -16: flops 9 x 8 x 12 6912 100.0% 0.0% 0.0% -16: flops 13 x 3 x 9 7020 100.0% 0.0% 0.0% -16: flops 12 x 2 x 25 7200 100.0% 0.0% 0.0% +16: flops 12 x 9 x 3 7128 100.0% 0.0% 0.0% 16: flops 9 x 3 x 8 7344 100.0% 0.0% 0.0% -16: flops 3 x 9 x 5 7560 100.0% 0.0% 0.0% -16: flops 9 x 13 x 33 7722 100.0% 0.0% 0.0% -16: flops 9 x 25 x 3 8100 100.0% 0.0% 0.0% -16: flops 3 x 9 x 13 8424 100.0% 0.0% 0.0% +16: flops 5 x 12 x 23 8280 100.0% 0.0% 0.0% +16: flops 5 x 3 x 9 8370 100.0% 0.0% 0.0% +16: flops 15 x 9 x 8 8640 100.0% 0.0% 0.0% 16: flops 12 x 5 x 9 8640 100.0% 0.0% 0.0% -16: flops 12 x 2 x 12 8640 100.0% 0.0% 0.0% -16: flops 9 x 15 x 8 8640 100.0% 0.0% 0.0% 16: flops 1 x 1 x 1 8772 100.0% 0.0% 0.0% -16: flops 5 x 3 x 9 8910 100.0% 0.0% 0.0% -16: flops 23 x 5 x 3 8970 100.0% 0.0% 0.0% +16: flops 3 x 9 x 5 8910 100.0% 0.0% 0.0% 16: flops 3 x 5 x 23 8970 100.0% 0.0% 0.0% -16: flops 15 x 13 x 23 8970 100.0% 0.0% 0.0% -16: flops 2 x 78 x 5 9360 100.0% 0.0% 0.0% -16: flops 23 x 8 x 3 9936 100.0% 0.0% 0.0% -16: flops 3 x 8 x 23 9936 100.0% 0.0% 0.0% -16: flops 78 x 2 x 8 9984 100.0% 0.0% 0.0% -16: flops 5 x 15 x 23 10350 100.0% 0.0% 0.0% -16: flops 23 x 15 x 5 10350 100.0% 0.0% 0.0% +16: flops 23 x 5 x 3 8970 100.0% 0.0% 0.0% +16: flops 3 x 12 x 9 9720 100.0% 0.0% 0.0% +16: flops 15 x 23 x 5 10350 100.0% 0.0% 0.0% 16: flops 9 x 3 x 12 10368 100.0% 0.0% 0.0% -16: flops 13 x 23 x 3 10764 100.0% 0.0% 0.0% -16: flops 8 x 3 x 9 10800 100.0% 0.0% 0.0% -16: flops 15 x 8 x 23 11040 100.0% 0.0% 0.0% -16: flops 2 x 78 x 12 11232 100.0% 0.0% 0.0% -16: flops 9 x 13 x 12 11232 100.0% 0.0% 0.0% -16: flops 23 x 8 x 33 12144 100.0% 0.0% 0.0% +16: flops 13 x 9 x 3 10530 100.0% 0.0% 0.0% +16: flops 8 x 3 x 9 11664 100.0% 0.0% 0.0% 16: flops 23 x 3 x 8 12144 100.0% 0.0% 0.0% -16: flops 64 x 8 x 3 12288 100.0% 0.0% 0.0% -16: flops 3 x 23 x 5 12420 100.0% 0.0% 0.0% +16: flops 25 x 3 x 9 12150 100.0% 0.0% 0.0% 16: flops 2 x 33 x 12 12672 100.0% 0.0% 0.0% 16: flops 9 x 5 x 12 12960 100.0% 0.0% 0.0% -16: flops 12 x 8 x 23 13248 100.0% 0.0% 0.0% -16: flops 3 x 25 x 9 13500 100.0% 0.0% 0.0% -16: flops 9 x 15 x 5 13500 100.0% 0.0% 0.0% -16: flops 3 x 23 x 25 13800 100.0% 0.0% 0.0% -16: flops 23 x 13 x 3 14352 100.0% 0.0% 0.0% -16: flops 13 x 3 x 23 14352 100.0% 0.0% 0.0% -16: flops 15 x 9 x 8 15120 100.0% 0.0% 0.0% -16: flops 78 x 2 x 5 15600 100.0% 0.0% 0.0% -16: flops 78 x 2 x 13 16224 100.0% 0.0% 0.0% -16: flops 3 x 9 x 8 16416 100.0% 0.0% 0.0% +16: flops 33 x 2 x 5 13200 100.0% 0.0% 0.0% +16: flops 13 x 3 x 9 13338 100.0% 0.0% 0.0% +16: flops 15 x 9 x 5 13500 100.0% 0.0% 0.0% +16: flops 15 x 8 x 23 16560 100.0% 0.0% 0.0% +16: flops 3 x 23 x 5 16560 100.0% 0.0% 0.0% 16: flops 23 x 5 x 12 16560 100.0% 0.0% 0.0% -16: flops 15 x 12 x 23 16560 100.0% 0.0% 0.0% -16: flops 5 x 12 x 23 16560 100.0% 0.0% 0.0% -16: flops 23 x 12 x 3 16560 100.0% 0.0% 0.0% -16: flops 12 x 13 x 9 16848 100.0% 0.0% 0.0% -16: flops 15 x 25 x 23 17250 100.0% 0.0% 0.0% -16: flops 12 x 8 x 9 17280 100.0% 0.0% 0.0% +16: flops 9 x 8 x 12 17280 100.0% 0.0% 0.0% 16: flops 33 x 5 x 9 17820 100.0% 0.0% 0.0% -16: flops 13 x 15 x 23 17940 100.0% 0.0% 0.0% -16: flops 15 x 23 x 13 17940 100.0% 0.0% 0.0% -16: flops 3 x 12 x 64 18432 100.0% 0.0% 0.0% -16: flops 3 x 8 x 64 18432 100.0% 0.0% 0.0% 16: flops 25 x 9 x 3 18900 100.0% 0.0% 0.0% +16: flops 9 x 8 x 33 19008 100.0% 0.0% 0.0% 16: flops 9 x 33 x 8 19008 100.0% 0.0% 0.0% -16: flops 23 x 13 x 33 19734 100.0% 0.0% 0.0% -16: flops 33 x 2 x 5 19800 100.0% 0.0% 0.0% 16: flops 23 x 3 x 12 19872 100.0% 0.0% 0.0% -16: flops 12 x 3 x 9 20088 100.0% 0.0% 0.0% +16: flops 5 x 23 x 3 20700 100.0% 0.0% 0.0% 16: flops 9 x 12 x 8 20736 100.0% 0.0% 0.0% -16: flops 15 x 9 x 13 21060 100.0% 0.0% 0.0% -16: flops 33 x 12 x 9 21384 100.0% 0.0% 0.0% -16: flops 5 x 23 x 3 21390 100.0% 0.0% 0.0% -16: flops 23 x 13 x 12 21528 100.0% 0.0% 0.0% +16: flops 23 x 8 x 3 20976 100.0% 0.0% 0.0% +16: flops 23 x 12 x 3 21528 100.0% 0.0% 0.0% 16: flops 9 x 12 x 5 21600 100.0% 0.0% 0.0% -16: flops 25 x 9 x 12 21600 100.0% 0.0% 0.0% +16: flops 3 x 9 x 8 22032 100.0% 0.0% 0.0% +16: flops 12 x 3 x 9 22032 100.0% 0.0% 0.0% +16: flops 5 x 3 x 23 22080 100.0% 0.0% 0.0% 16: flops 23 x 12 x 5 22080 100.0% 0.0% 0.0% -16: flops 13 x 9 x 12 22464 100.0% 0.0% 0.0% -16: flops 3 x 9 x 12 22680 100.0% 0.0% 0.0% +16: flops 12 x 8 x 9 22464 100.0% 0.0% 0.0% 16: flops 3 x 5 x 64 23040 100.0% 0.0% 0.0% -16: flops 3 x 23 x 8 23184 100.0% 0.0% 0.0% -16: flops 3 x 12 x 23 23184 100.0% 0.0% 0.0% -16: flops 33 x 8 x 9 23760 100.0% 0.0% 0.0% -16: flops 15 x 23 x 5 24150 100.0% 0.0% 0.0% -16: flops 64 x 3 x 5 24960 100.0% 0.0% 0.0% -16: flops 5 x 12 x 9 25920 100.0% 0.0% 0.0% -16: flops 78 x 2 x 12 26208 100.0% 0.0% 0.0% +16: flops 3 x 8 x 23 23184 100.0% 0.0% 0.0% +16: flops 5 x 12 x 9 24840 100.0% 0.0% 0.0% +16: flops 15 x 12 x 23 24840 100.0% 0.0% 0.0% +16: flops 33 x 2 x 12 25344 100.0% 0.0% 0.0% +16: flops 23 x 8 x 12 26496 100.0% 0.0% 0.0% +16: flops 64 x 3 x 5 26880 100.0% 0.0% 0.0% 16: flops 64 x 5 x 3 26880 100.0% 0.0% 0.0% -16: flops 5 x 3 x 23 26910 100.0% 0.0% 0.0% -16: flops 25 x 3 x 23 27600 100.0% 0.0% 0.0% -16: flops 25 x 12 x 23 27600 100.0% 0.0% 0.0% -16: flops 12 x 23 x 25 27600 100.0% 0.0% 0.0% -16: flops 64 x 12 x 3 27648 100.0% 0.0% 0.0% 16: flops 64 x 3 x 12 27648 100.0% 0.0% 0.0% 16: flops 9 x 5 x 33 29700 100.0% 0.0% 0.0% -16: flops 25 x 9 x 33 29700 100.0% 0.0% 0.0% -16: flops 13 x 64 x 3 29952 100.0% 0.0% 0.0% 16: flops 33 x 5 x 23 30360 100.0% 0.0% 0.0% -16: flops 64 x 15 x 8 30720 100.0% 0.0% 0.0% -16: flops 13 x 9 x 33 30888 100.0% 0.0% 0.0% -16: flops 33 x 2 x 12 31680 100.0% 0.0% 0.0% -16: flops 12 x 9 x 25 32400 100.0% 0.0% 0.0% -16: flops 12 x 25 x 9 32400 100.0% 0.0% 0.0% -16: flops 13 x 12 x 9 33696 100.0% 0.0% 0.0% -16: flops 15 x 9 x 5 33750 100.0% 0.0% 0.0% -16: flops 64 x 3 x 8 33792 100.0% 0.0% 0.0% -16: flops 8 x 64 x 33 33792 100.0% 0.0% 0.0% -16: flops 25 x 15 x 23 34500 100.0% 0.0% 0.0% -16: flops 3 x 13 x 64 34944 100.0% 0.0% 0.0% -16: flops 64 x 13 x 3 34944 100.0% 0.0% 0.0% +16: flops 15 x 64 x 8 30720 100.0% 0.0% 0.0% +16: flops 12 x 8 x 23 30912 100.0% 0.0% 0.0% +16: flops 3 x 9 x 12 31104 100.0% 0.0% 0.0% +16: flops 3 x 12 x 64 32256 100.0% 0.0% 0.0% +16: flops 5 x 9 x 12 32400 100.0% 0.0% 0.0% +16: flops 8 x 33 x 64 33792 100.0% 0.0% 0.0% +16: flops 64 x 8 x 33 33792 100.0% 0.0% 0.0% +16: flops 33 x 8 x 64 33792 100.0% 0.0% 0.0% +16: flops 3 x 12 x 23 34776 100.0% 0.0% 0.0% 16: flops 78 x 5 x 23 35880 100.0% 0.0% 0.0% -16: flops 64 x 15 x 5 38400 100.0% 0.0% 0.0% -16: flops 33 x 13 x 9 38610 100.0% 0.0% 0.0% +16: flops 3 x 23 x 8 36432 100.0% 0.0% 0.0% +16: flops 64 x 3 x 8 36864 100.0% 0.0% 0.0% +16: flops 64 x 12 x 3 36864 100.0% 0.0% 0.0% 16: flops 9 x 33 x 5 38610 100.0% 0.0% 0.0% -16: flops 12 x 23 x 5 38640 100.0% 0.0% 0.0% -16: flops 8 x 15 x 23 38640 100.0% 0.0% 0.0% -16: flops 23 x 15 x 8 38640 100.0% 0.0% 0.0% -16: flops 5 x 9 x 12 38880 100.0% 0.0% 0.0% -16: flops 33 x 23 x 13 39468 100.0% 0.0% 0.0% -16: flops 13 x 3 x 64 39936 100.0% 0.0% 0.0% -16: flops 3 x 9 x 25 40500 100.0% 0.0% 0.0% -16: flops 15 x 9 x 25 40500 100.0% 0.0% 0.0% -16: flops 8 x 23 x 3 40848 100.0% 0.0% 0.0% -16: flops 12 x 23 x 3 41400 100.0% 0.0% 0.0% -16: flops 3 x 25 x 23 41400 100.0% 0.0% 0.0% -16: flops 23 x 25 x 12 41400 100.0% 0.0% 0.0% -16: flops 9 x 12 x 12 41472 100.0% 0.0% 0.0% +16: flops 15 x 23 x 8 38640 100.0% 0.0% 0.0% +16: flops 13 x 9 x 12 39312 100.0% 0.0% 0.0% +16: flops 33 x 8 x 9 42768 100.0% 0.0% 0.0% +16: flops 64 x 8 x 3 43008 100.0% 0.0% 0.0% 16: flops 13 x 23 x 12 43056 100.0% 0.0% 0.0% -16: flops 3 x 23 x 12 43056 100.0% 0.0% 0.0% -16: flops 12 x 9 x 8 43200 100.0% 0.0% 0.0% -16: flops 9 x 25 x 12 43200 100.0% 0.0% 0.0% 16: flops 25 x 12 x 9 43200 100.0% 0.0% 0.0% -16: flops 8 x 9 x 12 44928 100.0% 0.0% 0.0% -16: flops 64 x 15 x 12 46080 100.0% 0.0% 0.0% -16: flops 33 x 9 x 13 46332 100.0% 0.0% 0.0% -16: flops 8 x 9 x 33 47520 100.0% 0.0% 0.0% -16: flops 33 x 9 x 8 47520 100.0% 0.0% 0.0% -16: flops 23 x 25 x 3 48300 100.0% 0.0% 0.0% -16: flops 9 x 78 x 5 49140 100.0% 0.0% 0.0% -16: flops 12 x 8 x 64 49152 100.0% 0.0% 0.0% -16: flops 5 x 23 x 12 49680 100.0% 0.0% 0.0% -16: flops 3 x 64 x 13 49920 100.0% 0.0% 0.0% -16: flops 8 x 12 x 9 50112 100.0% 0.0% 0.0% -16: flops 12 x 9 x 13 50544 100.0% 0.0% 0.0% -16: flops 12 x 9 x 5 52920 100.0% 0.0% 0.0% -16: flops 23 x 12 x 12 52992 100.0% 0.0% 0.0% -16: flops 5 x 33 x 9 53460 100.0% 0.0% 0.0% -16: flops 8 x 3 x 23 54096 100.0% 0.0% 0.0% -16: flops 64 x 13 x 33 54912 100.0% 0.0% 0.0% -16: flops 25 x 23 x 3 55200 100.0% 0.0% 0.0% -16: flops 78 x 9 x 5 56160 100.0% 0.0% 0.0% +16: flops 8 x 23 x 3 44160 100.0% 0.0% 0.0% +16: flops 12 x 23 x 3 44712 100.0% 0.0% 0.0% +16: flops 5 x 33 x 23 45540 100.0% 0.0% 0.0% +16: flops 9 x 12 x 12 46656 100.0% 0.0% 0.0% +16: flops 5 x 23 x 12 46920 100.0% 0.0% 0.0% +16: flops 8 x 9 x 12 48384 100.0% 0.0% 0.0% +16: flops 23 x 8 x 33 48576 100.0% 0.0% 0.0% +16: flops 78 x 9 x 5 49140 100.0% 0.0% 0.0% +16: flops 5 x 3 x 64 49920 100.0% 0.0% 0.0% +16: flops 13 x 12 x 23 50232 100.0% 0.0% 0.0% +16: flops 5 x 33 x 9 50490 100.0% 0.0% 0.0% +16: flops 3 x 8 x 64 52224 100.0% 0.0% 0.0% +16: flops 25 x 9 x 12 54000 100.0% 0.0% 0.0% 16: flops 78 x 5 x 9 56160 100.0% 0.0% 0.0% -16: flops 64 x 25 x 3 57600 100.0% 0.0% 0.0% -16: flops 9 x 15 x 12 58320 100.0% 0.0% 0.0% -16: flops 9 x 25 x 33 59400 100.0% 0.0% 0.0% -16: flops 12 x 12 x 9 59616 100.0% 0.0% 0.0% -16: flops 13 x 33 x 9 61776 100.0% 0.0% 0.0% -16: flops 8 x 23 x 12 61824 100.0% 0.0% 0.0% +16: flops 8 x 9 x 33 57024 100.0% 0.0% 0.0% +16: flops 33 x 9 x 8 57024 100.0% 0.0% 0.0% +16: flops 33 x 12 x 9 57024 100.0% 0.0% 0.0% +16: flops 15 x 64 x 5 57600 100.0% 0.0% 0.0% +16: flops 5 x 64 x 3 57600 100.0% 0.0% 0.0% +16: flops 15 x 9 x 12 58320 100.0% 0.0% 0.0% +16: flops 8 x 3 x 23 58512 100.0% 0.0% 0.0% +16: flops 3 x 23 x 12 59616 100.0% 0.0% 0.0% +16: flops 23 x 12 x 12 59616 100.0% 0.0% 0.0% +16: flops 12 x 3 x 64 59904 100.0% 0.0% 0.0% +16: flops 8 x 12 x 9 60480 100.0% 0.0% 0.0% +16: flops 12 x 9 x 8 62208 100.0% 0.0% 0.0% 16: flops 64 x 5 x 33 63360 100.0% 0.0% 0.0% -16: flops 9 x 12 x 33 64152 100.0% 0.0% 0.0% +16: flops 13 x 12 x 9 64584 100.0% 0.0% 0.0% +16: flops 12 x 9 x 5 64800 100.0% 0.0% 0.0% +16: flops 15 x 23 x 12 66240 100.0% 0.0% 0.0% +16: flops 12 x 23 x 5 66240 100.0% 0.0% 0.0% 16: flops 23 x 12 x 8 66240 100.0% 0.0% 0.0% -16: flops 8 x 12 x 23 66240 100.0% 0.0% 0.0% -16: flops 23 x 15 x 12 66240 100.0% 0.0% 0.0% -16: flops 9 x 78 x 8 67392 100.0% 0.0% 0.0% -16: flops 78 x 12 x 9 67392 100.0% 0.0% 0.0% -16: flops 5 x 3 x 64 69120 100.0% 0.0% 0.0% +16: flops 78 x 9 x 8 67392 100.0% 0.0% 0.0% +16: flops 13 x 23 x 3 68172 100.0% 0.0% 0.0% +16: flops 12 x 64 x 3 69120 100.0% 0.0% 0.0% +16: flops 8 x 12 x 23 70656 100.0% 0.0% 0.0% +16: flops 8 x 23 x 12 70656 100.0% 0.0% 0.0% 16: flops 9 x 33 x 12 71280 100.0% 0.0% 0.0% -16: flops 15 x 23 x 8 71760 100.0% 0.0% 0.0% -16: flops 33 x 8 x 23 72864 100.0% 0.0% 0.0% -16: flops 3 x 64 x 12 73728 100.0% 0.0% 0.0% -16: flops 64 x 12 x 8 73728 100.0% 0.0% 0.0% -16: flops 64 x 8 x 12 73728 100.0% 0.0% 0.0% -16: flops 33 x 25 x 9 74250 100.0% 0.0% 0.0% -16: flops 12 x 15 x 23 74520 100.0% 0.0% 0.0% -16: flops 25 x 23 x 33 75900 100.0% 0.0% 0.0% +16: flops 5 x 9 x 33 71280 100.0% 0.0% 0.0% +16: flops 13 x 3 x 23 71760 100.0% 0.0% 0.0% +16: flops 12 x 12 x 9 72576 100.0% 0.0% 0.0% 16: flops 23 x 5 x 33 75900 100.0% 0.0% 0.0% -16: flops 3 x 25 x 64 76800 100.0% 0.0% 0.0% -16: flops 13 x 23 x 33 78936 100.0% 0.0% 0.0% +16: flops 12 x 3 x 23 76176 100.0% 0.0% 0.0% 16: flops 3 x 64 x 5 80640 100.0% 0.0% 0.0% -16: flops 5 x 64 x 3 80640 100.0% 0.0% 0.0% -16: flops 12 x 3 x 23 81144 100.0% 0.0% 0.0% -16: flops 25 x 23 x 12 82800 100.0% 0.0% 0.0% -16: flops 12 x 25 x 23 82800 100.0% 0.0% 0.0% +16: flops 25 x 3 x 23 82800 100.0% 0.0% 0.0% +16: flops 3 x 64 x 12 82944 100.0% 0.0% 0.0% 16: flops 23 x 33 x 5 83490 100.0% 0.0% 0.0% 16: flops 33 x 5 x 64 84480 100.0% 0.0% 0.0% -16: flops 78 x 8 x 23 86112 100.0% 0.0% 0.0% -16: flops 12 x 3 x 64 87552 100.0% 0.0% 0.0% -16: flops 5 x 9 x 33 89100 100.0% 0.0% 0.0% -16: flops 23 x 78 x 5 89700 100.0% 0.0% 0.0% -16: flops 5 x 33 x 23 91080 100.0% 0.0% 0.0% -16: flops 64 x 12 x 5 92160 100.0% 0.0% 0.0% -16: flops 15 x 64 x 8 92160 100.0% 0.0% 0.0% -16: flops 33 x 9 x 5 98010 100.0% 0.0% 0.0% -16: flops 3 x 64 x 8 98304 100.0% 0.0% 0.0% -16: flops 8 x 33 x 9 99792 100.0% 0.0% 0.0% -16: flops 12 x 13 x 64 99840 100.0% 0.0% 0.0% +16: flops 13 x 9 x 33 84942 100.0% 0.0% 0.0% +16: flops 9 x 12 x 33 85536 100.0% 0.0% 0.0% +16: flops 12 x 33 x 9 85536 100.0% 0.0% 0.0% +16: flops 64 x 12 x 8 86016 100.0% 0.0% 0.0% +16: flops 78 x 23 x 5 89700 100.0% 0.0% 0.0% +16: flops 15 x 64 x 12 92160 100.0% 0.0% 0.0% +16: flops 8 x 64 x 3 98304 100.0% 0.0% 0.0% +16: flops 12 x 12 x 23 99360 100.0% 0.0% 0.0% 16: flops 12 x 5 x 64 99840 100.0% 0.0% 0.0% -16: flops 12 x 9 x 12 101088 100.0% 0.0% 0.0% -16: flops 8 x 33 x 64 101376 100.0% 0.0% 0.0% -16: flops 33 x 12 x 64 101376 100.0% 0.0% 0.0% -16: flops 15 x 9 x 12 103680 100.0% 0.0% 0.0% -16: flops 64 x 25 x 33 105600 100.0% 0.0% 0.0% -16: flops 5 x 78 x 23 107640 100.0% 0.0% 0.0% +16: flops 8 x 3 x 64 101376 100.0% 0.0% 0.0% +16: flops 8 x 64 x 33 101376 100.0% 0.0% 0.0% +16: flops 25 x 9 x 33 103950 100.0% 0.0% 0.0% 16: flops 23 x 33 x 8 109296 100.0% 0.0% 0.0% -16: flops 78 x 9 x 13 109512 100.0% 0.0% 0.0% -16: flops 78 x 13 x 9 109512 100.0% 0.0% 0.0% -16: flops 12 x 23 x 8 110400 100.0% 0.0% 0.0% -16: flops 12 x 64 x 3 110592 100.0% 0.0% 0.0% -16: flops 78 x 8 x 9 112320 100.0% 0.0% 0.0% -16: flops 12 x 12 x 23 112608 100.0% 0.0% 0.0% -16: flops 25 x 64 x 3 115200 100.0% 0.0% 0.0% -16: flops 15 x 23 x 12 115920 100.0% 0.0% 0.0% -16: flops 8 x 64 x 3 116736 100.0% 0.0% 0.0% +16: flops 8 x 33 x 9 109296 100.0% 0.0% 0.0% +16: flops 25 x 23 x 12 110400 100.0% 0.0% 0.0% +16: flops 25 x 12 x 23 110400 100.0% 0.0% 0.0% +16: flops 3 x 64 x 8 110592 100.0% 0.0% 0.0% +16: flops 33 x 9 x 5 115830 100.0% 0.0% 0.0% +16: flops 25 x 23 x 3 117300 100.0% 0.0% 0.0% 16: flops 25 x 33 x 9 118800 100.0% 0.0% 0.0% -16: flops 64 x 13 x 12 119808 100.0% 0.0% 0.0% -16: flops 8 x 23 x 33 121440 100.0% 0.0% 0.0% -16: flops 78 x 9 x 8 123552 100.0% 0.0% 0.0% -16: flops 78 x 23 x 5 125580 100.0% 0.0% 0.0% -16: flops 12 x 23 x 12 125856 100.0% 0.0% 0.0% +16: flops 64 x 12 x 5 122880 100.0% 0.0% 0.0% +16: flops 12 x 8 x 64 122880 100.0% 0.0% 0.0% 16: flops 64 x 33 x 5 126720 100.0% 0.0% 0.0% -16: flops 8 x 3 x 64 132096 100.0% 0.0% 0.0% +16: flops 12 x 9 x 12 129600 100.0% 0.0% 0.0% 16: flops 64 x 33 x 8 135168 100.0% 0.0% 0.0% 16: flops 64 x 5 x 12 138240 100.0% 0.0% 0.0% -16: flops 78 x 9 x 25 140400 100.0% 0.0% 0.0% -16: flops 12 x 33 x 9 142560 100.0% 0.0% 0.0% -16: flops 33 x 12 x 23 145728 100.0% 0.0% 0.0% -16: flops 25 x 33 x 23 151800 100.0% 0.0% 0.0% -16: flops 23 x 25 x 33 151800 100.0% 0.0% 0.0% -16: flops 25 x 3 x 64 153600 100.0% 0.0% 0.0% -16: flops 33 x 9 x 12 156816 100.0% 0.0% 0.0% -16: flops 23 x 12 x 33 163944 100.0% 0.0% 0.0% -16: flops 33 x 13 x 64 164736 100.0% 0.0% 0.0% -16: flops 5 x 78 x 9 168480 100.0% 0.0% 0.0% -16: flops 78 x 12 x 23 172224 100.0% 0.0% 0.0% -16: flops 15 x 64 x 5 172800 100.0% 0.0% 0.0% -16: flops 78 x 23 x 25 179400 100.0% 0.0% 0.0% -16: flops 25 x 78 x 23 179400 100.0% 0.0% 0.0% -16: flops 12 x 64 x 8 184320 100.0% 0.0% 0.0% -16: flops 33 x 23 x 5 189750 100.0% 0.0% 0.0% -16: flops 5 x 64 x 33 190080 100.0% 0.0% 0.0% -16: flops 9 x 78 x 12 202176 100.0% 0.0% 0.0% +16: flops 13 x 64 x 3 139776 100.0% 0.0% 0.0% +16: flops 8 x 23 x 33 145728 100.0% 0.0% 0.0% +16: flops 78 x 8 x 9 146016 100.0% 0.0% 0.0% +16: flops 5 x 64 x 33 147840 100.0% 0.0% 0.0% +16: flops 78 x 12 x 9 151632 100.0% 0.0% 0.0% +16: flops 33 x 12 x 64 152064 100.0% 0.0% 0.0% +16: flops 13 x 33 x 9 162162 100.0% 0.0% 0.0% +16: flops 13 x 3 x 64 164736 100.0% 0.0% 0.0% +16: flops 5 x 33 x 64 168960 100.0% 0.0% 0.0% +16: flops 33 x 8 x 23 170016 100.0% 0.0% 0.0% +16: flops 12 x 23 x 12 172224 100.0% 0.0% 0.0% +16: flops 25 x 3 x 64 172800 100.0% 0.0% 0.0% +16: flops 25 x 64 x 3 172800 100.0% 0.0% 0.0% +16: flops 5 x 23 x 33 182160 100.0% 0.0% 0.0% +16: flops 33 x 12 x 23 182160 100.0% 0.0% 0.0% +16: flops 64 x 8 x 12 184320 100.0% 0.0% 0.0% +16: flops 12 x 9 x 33 185328 100.0% 0.0% 0.0% +16: flops 12 x 23 x 8 198720 100.0% 0.0% 0.0% +16: flops 78 x 8 x 23 200928 100.0% 0.0% 0.0% 16: flops 78 x 9 x 12 202176 100.0% 0.0% 0.0% -16: flops 33 x 23 x 8 206448 100.0% 0.0% 0.0% -16: flops 78 x 25 x 9 210600 100.0% 0.0% 0.0% -16: flops 33 x 25 x 64 211200 100.0% 0.0% 0.0% -16: flops 12 x 9 x 33 213840 100.0% 0.0% 0.0% -16: flops 23 x 78 x 12 215280 100.0% 0.0% 0.0% +16: flops 25 x 33 x 64 211200 100.0% 0.0% 0.0% +16: flops 33 x 9 x 12 213840 100.0% 0.0% 0.0% +16: flops 5 x 12 x 64 215040 100.0% 0.0% 0.0% 16: flops 78 x 23 x 12 215280 100.0% 0.0% 0.0% -16: flops 13 x 78 x 9 219024 100.0% 0.0% 0.0% -16: flops 13 x 64 x 33 219648 100.0% 0.0% 0.0% -16: flops 5 x 23 x 33 227700 100.0% 0.0% 0.0% -16: flops 25 x 64 x 12 230400 100.0% 0.0% 0.0% -16: flops 15 x 64 x 12 230400 100.0% 0.0% 0.0% -16: flops 3 x 64 x 25 230400 100.0% 0.0% 0.0% +16: flops 78 x 12 x 23 215280 100.0% 0.0% 0.0% +16: flops 13 x 23 x 33 217074 100.0% 0.0% 0.0% +16: flops 23 x 12 x 33 218592 100.0% 0.0% 0.0% +16: flops 8 x 12 x 64 221184 100.0% 0.0% 0.0% 16: flops 23 x 33 x 12 236808 100.0% 0.0% 0.0% -16: flops 13 x 64 x 12 239616 100.0% 0.0% 0.0% -16: flops 13 x 12 x 64 239616 100.0% 0.0% 0.0% -16: flops 5 x 33 x 64 253440 100.0% 0.0% 0.0% -16: flops 64 x 12 x 33 253440 100.0% 0.0% 0.0% -16: flops 64 x 12 x 12 258048 100.0% 0.0% 0.0% -16: flops 25 x 78 x 9 280800 100.0% 0.0% 0.0% -16: flops 23 x 78 x 8 287040 100.0% 0.0% 0.0% -16: flops 5 x 12 x 64 299520 100.0% 0.0% 0.0% -16: flops 64 x 78 x 5 299520 100.0% 0.0% 0.0% -16: flops 12 x 64 x 25 307200 100.0% 0.0% 0.0% -16: flops 8 x 12 x 64 319488 100.0% 0.0% 0.0% -16: flops 12 x 64 x 13 319488 100.0% 0.0% 0.0% -16: flops 12 x 78 x 9 320112 100.0% 0.0% 0.0% -16: flops 8 x 78 x 9 325728 100.0% 0.0% 0.0% -16: flops 33 x 64 x 8 337920 100.0% 0.0% 0.0% -16: flops 12 x 25 x 64 345600 100.0% 0.0% 0.0% +16: flops 33 x 23 x 5 250470 100.0% 0.0% 0.0% +16: flops 12 x 64 x 8 258048 100.0% 0.0% 0.0% +16: flops 25 x 23 x 33 265650 100.0% 0.0% 0.0% +16: flops 13 x 33 x 23 276276 100.0% 0.0% 0.0% +16: flops 78 x 23 x 8 287040 100.0% 0.0% 0.0% +16: flops 64 x 12 x 33 304128 100.0% 0.0% 0.0% +16: flops 33 x 23 x 8 327888 100.0% 0.0% 0.0% +16: flops 13 x 64 x 33 329472 100.0% 0.0% 0.0% +16: flops 64 x 12 x 12 331776 100.0% 0.0% 0.0% +16: flops 5 x 64 x 12 345600 100.0% 0.0% 0.0% +16: flops 78 x 64 x 5 349440 100.0% 0.0% 0.0% 16: flops 12 x 33 x 64 354816 100.0% 0.0% 0.0% -16: flops 8 x 33 x 23 364320 100.0% 0.0% 0.0% +16: flops 12 x 33 x 23 364320 100.0% 0.0% 0.0% 16: flops 12 x 64 x 5 368640 100.0% 0.0% 0.0% 16: flops 33 x 64 x 5 380160 100.0% 0.0% 0.0% -16: flops 78 x 8 x 64 399360 100.0% 0.0% 0.0% -16: flops 78 x 23 x 8 401856 100.0% 0.0% 0.0% -16: flops 5 x 64 x 12 414720 100.0% 0.0% 0.0% -16: flops 25 x 33 x 64 422400 100.0% 0.0% 0.0% -16: flops 33 x 64 x 25 422400 100.0% 0.0% 0.0% -16: flops 8 x 78 x 23 430560 100.0% 0.0% 0.0% -16: flops 13 x 33 x 64 439296 100.0% 0.0% 0.0% +16: flops 8 x 33 x 23 388608 100.0% 0.0% 0.0% +16: flops 33 x 64 x 8 405504 100.0% 0.0% 0.0% +16: flops 13 x 64 x 12 419328 100.0% 0.0% 0.0% +16: flops 25 x 64 x 33 422400 100.0% 0.0% 0.0% 16: flops 78 x 5 x 64 449280 100.0% 0.0% 0.0% -16: flops 33 x 23 x 12 455400 100.0% 0.0% 0.0% -16: flops 33 x 25 x 23 455400 100.0% 0.0% 0.0% -16: flops 64 x 25 x 12 460800 100.0% 0.0% 0.0% -16: flops 12 x 33 x 23 473616 100.0% 0.0% 0.0% -16: flops 8 x 64 x 12 479232 100.0% 0.0% 0.0% -16: flops 78 x 64 x 25 499200 100.0% 0.0% 0.0% -16: flops 64 x 33 x 12 506880 100.0% 0.0% 0.0% -16: flops 25 x 12 x 64 537600 100.0% 0.0% 0.0% -16: flops 78 x 25 x 23 538200 100.0% 0.0% 0.0% -16: flops 12 x 23 x 33 546480 100.0% 0.0% 0.0% -16: flops 12 x 78 x 23 559728 100.0% 0.0% 0.0% -16: flops 12 x 12 x 64 626688 100.0% 0.0% 0.0% -16: flops 64 x 78 x 8 638976 100.0% 0.0% 0.0% -16: flops 78 x 64 x 5 648960 100.0% 0.0% 0.0% -16: flops 12 x 64 x 12 737280 100.0% 0.0% 0.0% -16: flops 15 x 64 x 25 768000 100.0% 0.0% 0.0% -16: flops 78 x 64 x 13 778752 100.0% 0.0% 0.0% -16: flops 78 x 13 x 64 778752 100.0% 0.0% 0.0% -16: flops 12 x 64 x 33 912384 100.0% 0.0% 0.0% -16: flops 25 x 78 x 64 998400 100.0% 0.0% 0.0% -16: flops 78 x 12 x 64 1198080 100.0% 0.0% 0.0% -16: flops 78 x 25 x 64 1248000 100.0% 0.0% 0.0% -16: flops 5 x 78 x 64 1347840 100.0% 0.0% 0.0% -16: flops 8 x 78 x 64 1357824 100.0% 0.0% 0.0% -16: flops 64 x 78 x 12 1437696 100.0% 0.0% 0.0% -16: flops 13 x 78 x 64 1557504 100.0% 0.0% 0.0% -16: flops 33 x 64 x 12 1571328 100.0% 0.0% 0.0% -16: flops 78 x 64 x 8 1837056 100.0% 0.0% 0.0% -16: flops 78 x 64 x 12 2995200 100.0% 0.0% 0.0% -16: flops 12 x 78 x 64 3714048 100.0% 0.0% 0.0% -16: flops inhomo. stacks 879264000 100.0% 0.0% 0.0% -16: flops total 936.054168E+06 100.0% 0.0% 0.0% -16: flops max/rank 100.921804E+06 100.0% 0.0% 0.0% -16: matmuls inhomo. stacks 4350 100.0% 0.0% 0.0% +16: flops 12 x 23 x 33 473616 100.0% 0.0% 0.0% +16: flops 25 x 12 x 64 499200 100.0% 0.0% 0.0% +16: flops 8 x 64 x 12 516096 100.0% 0.0% 0.0% +16: flops 13 x 12 x 64 519168 100.0% 0.0% 0.0% +16: flops 64 x 33 x 12 557568 100.0% 0.0% 0.0% +16: flops 78 x 8 x 64 559104 100.0% 0.0% 0.0% +16: flops 25 x 64 x 12 576000 100.0% 0.0% 0.0% +16: flops 25 x 33 x 23 607200 100.0% 0.0% 0.0% +16: flops 12 x 12 x 64 608256 100.0% 0.0% 0.0% +16: flops 12 x 64 x 33 658944 100.0% 0.0% 0.0% +16: flops 33 x 23 x 12 710424 100.0% 0.0% 0.0% +16: flops 13 x 33 x 64 713856 100.0% 0.0% 0.0% +16: flops 78 x 64 x 8 718848 100.0% 0.0% 0.0% +16: flops 12 x 64 x 12 884736 100.0% 0.0% 0.0% +16: flops 78 x 12 x 64 1557504 100.0% 0.0% 0.0% +16: flops 33 x 64 x 12 1672704 100.0% 0.0% 0.0% +16: flops 78 x 64 x 12 1797120 100.0% 0.0% 0.0% +16: flops inhomo. stacks 1045363200 100.0% 0.0% 0.0% +16: flops total 1.078733E+09 100.0% 0.0% 0.0% +16: flops max/rank 181.647356E+06 100.0% 0.0% 0.0% +16: matmuls inhomo. stacks 4923 100.0% 0.0% 0.0% 16: matmuls total 13158 100.0% 0.0% 0.0% -16: number of processed stacks 6723 100.0% 0.0% 0.0% -16: average stack size 2.0 0.0 0.0 -16: marketing flops 18.257457E+09 +16: number of processed stacks 4812 100.0% 0.0% 0.0% +16: average stack size 2.7 0.0 0.0 +16: marketing flops 18.257453E+09 16: ------------------------------------------------------------------------------- 16: # multiplications 72 -16: max memory usage/rank 103.292928E+06 -16: # max total images/rank 4 +16: max memory usage/rank 77.438976E+06 +16: # max total images/rank 7 16: # max 3D layers 1 -16: # MPI messages exchanged 5856 +16: # MPI messages exchanged 1344 16: MPI messages size (bytes): -16: total size 55.153728E+06 +16: total size 56.434752E+06 16: min size 0.000000E+00 -16: max size 82.496000E+03 -16: average size 9.418328E+03 +16: max size 122.232000E+03 +16: average size 41.990145E+03 16: MPI breakdown and total messages size (bytes): -16: size <= 128 1876 19120 -16: 128 < size <= 8192 1942 6625984 -16: 8192 < size <= 32768 1588 27190384 -16: 32768 < size <= 131072 450 21318240 +16: size <= 128 72 1152 +16: 128 < size <= 8192 132 430560 +16: 8192 < size <= 32768 360 7101216 +16: 32768 < size <= 131072 780 48901824 16: 131072 < size <= 4194304 0 0 16: 4194304 < size <= 16777216 0 0 16: 16777216 < size 0 0 16: ------------------------------------------------------------------------------- 16: 16: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -16: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** +16: *** might lead to poor performance. Used ranks: 7 Suggested: 9 16 *** 16: 16: ------------------------------------------------------------------------------- 16: - - @@ -57885,11 +57758,11 @@ 16: - - 16: ------------------------------------------------------------------------------- 16: ROUTINE CALLS AVE VOLUME [Bytes] -16: MP_Bcast 451 11. -16: MP_Allreduce 1787 17. -16: MP_Alltoall 816 6497. -16: MP_ISend 2750 3810. -16: MP_IRecv 2918 3321. +16: MP_Bcast 322 10. +16: MP_Allreduce 1553 16. +16: MP_Alltoall 816 13929. +16: MP_ISend 2492 7298. +16: MP_IRecv 2398 7582. 16: ------------------------------------------------------------------------------- 16: 16: ------------------------------------------------------------------------------- @@ -57899,164 +57772,164 @@ 16: ------------------------------------------------------------------------------- 16: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 16: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -16: dbcsr_tas_multiply 48 2.5 0.000 0.000 1.893 1.893 3 -16: dbcsr_tas_total 48 3.5 0.006 0.014 1.889 1.889 0 -16: dbcsr_tas_result_index 24 3.0 0.002 0.003 0.894 0.894 6 -16: dbcsr_multiply_generic 72 4.7 0.005 0.006 0.755 0.803 5 -16: mp_sync 192 4.6 0.545 0.611 0.545 0.611 11 -16: dbcsr_tas_reshape 120 4.9 0.002 0.002 0.508 0.550 2 -16: mp_alltoall_i 168 6.8 0.465 0.515 0.465 0.515 3 -16: dbcsr_tas_dbcsr 48 4.5 0.000 0.000 0.434 0.435 0 -16: dbcsr_create_new 1644 5.6 0.237 0.361 0.251 0.372 2 -16: dbcsr_tas_reshape_alltoall 120 5.9 0.000 0.000 0.336 0.371 10 -16: make_m2s 144 5.7 0.002 0.002 0.321 0.366 2 -16: make_images 144 6.7 0.037 0.070 0.316 0.362 2 -16: dbcsr_complete_redistribute 72 1.0 0.015 0.018 0.288 0.305 0 -16: multiply_cannon 72 5.7 0.041 0.053 0.265 0.293 11 -16: mp_alltoall_i22 72 2.0 0.213 0.241 0.213 0.241 3 -16: mp_sum_l 803 4.1 0.213 0.237 0.213 0.237 3 -16: dbcsr_checksum 48 1.0 0.021 0.034 0.190 0.212 7 -16: mp_cart_create 328 6.7 0.162 0.207 0.162 0.207 3 -16: make_images_sizes 144 7.7 0.000 0.000 0.170 0.199 0 -16: mp_alltoall_i44 144 8.7 0.170 0.199 0.170 0.199 3 -16: reshape_mm_small 48 4.5 0.008 0.009 0.184 0.197 2 -16: mp_sum_d 303 1.2 0.171 0.191 0.171 0.191 2 -16: reshape_mm_compatible 48 4.5 0.001 0.001 0.158 0.170 0 -16: multiply_cannon_loop 72 6.7 0.008 0.011 0.146 0.170 3 -16: mp_waitall_1 2528 8.5 0.144 0.167 0.144 0.167 10 -16: dbcsr_tas_replicate 48 4.5 0.003 0.004 0.153 0.165 0 -16: dbcsr_tas_communicate_buffer 168 6.8 0.004 0.004 0.141 0.162 6 -16: mp_waitall_2 328 7.7 0.133 0.153 0.133 0.153 6 -16: dbcsr_tas_mm_2 16 5.5 0.000 0.000 0.152 0.152 1 -16: dbcsr_finalize 676 4.0 0.009 0.019 0.068 0.130 1 -16: dbcsr_tas_create_new 246 4.9 0.001 0.002 0.081 0.123 10 -16: make_images_data 144 7.7 0.003 0.003 0.083 0.121 0 -16: dbcsr_merge_all 240 5.1 0.049 0.105 0.056 0.118 7 -16: dbcsr_tas_reshape_communicate_ 120 5.9 0.000 0.000 0.097 0.115 2 -16: hybrid_alltoall_any 144 8.7 0.006 0.016 0.063 0.104 1 -16: dbcsr_tas_replicate_alltoall 32 5.5 0.000 0.000 0.082 0.097 11 -16: dbcsr_tas_mm_1N 12 5.0 0.000 0.000 0.059 0.091 0 -16: dbcsr_tas_merge 16 4.5 0.002 0.002 0.082 0.090 11 -16: dbcsr_tas_distribution_new 174 5.3 0.002 0.002 0.067 0.081 2 -16: dbcsr_tas_create_split 78 5.5 0.000 0.000 0.067 0.081 0 -16: dbcsr_tas_create_split_rows_or 78 6.5 0.001 0.001 0.067 0.080 2 -16: mp_comm_dup 78 7.5 0.061 0.074 0.061 0.074 3 -16: mp_allgather_i34 72 6.7 0.060 0.073 0.060 0.073 3 -16: dbcsr_tas_reshape_buffer_fill 120 5.9 0.004 0.005 0.043 0.073 6 -16: multiply_cannon_metrocomm3 376 5.3 0.001 0.001 0.041 0.072 2 -16: multiply_cannon_metrocomm1 376 5.3 0.001 0.001 0.050 0.072 2 -16: dbcsr_add_anytype 72 3.7 0.016 0.032 0.047 0.068 1 -16: mp_max_d 25 1.0 0.053 0.062 0.053 0.062 3 -16: reshape_mm_template 24 7.0 0.002 0.002 0.053 0.062 0 -16: dbcsr_tas_mm_3T 12 5.0 0.000 0.000 0.046 0.059 0 -16: dbcsr_tas_merge_alltoall 16 5.5 0.000 0.000 0.046 0.053 6 -16: dbcsr_scale_anytype 88 4.3 0.002 0.007 0.033 0.052 1 -16: dbcsr_new_transposed 56 5.1 0.001 0.001 0.026 0.050 1 -16: convert_to_new_pgrid 144 4.5 0.000 0.000 0.019 0.049 0 -16: dbcsr_iterator_start 1402 5.3 0.034 0.048 0.035 0.049 6 -16: dbcsr_tas_replicate_communicat 32 5.5 0.000 0.000 0.033 0.042 0 -16: multiply_cannon_multrec 376 5.3 0.019 0.025 0.026 0.040 2 -16: dbcsr_tas_reshape_buffer_obtai 120 5.9 0.007 0.008 0.022 0.032 2 -16: dbcsr_tas_convert_to_dbcsr 72 1.0 0.004 0.004 0.020 0.032 6 -16: dbcsr_tas_setup_test_matrix 6 1.0 0.005 0.008 0.030 0.031 0 -16: dbcsr_reserve_blocks 288 5.5 0.020 0.030 0.020 0.030 4 -16: calculate_norms 752 5.3 0.015 0.029 0.015 0.029 0 -16: dbcsr_copy 240 5.6 0.003 0.008 0.017 0.027 8 -16: dbcsr_special_finalize 264 6.0 0.002 0.005 0.017 0.027 10 -16: dbcsr_tas_mm_1T 4 7.0 0.000 0.000 0.017 0.026 0 -16: dbcsr_tas_reserve_blocks_index 168 6.0 0.001 0.001 0.015 0.025 2 -16: dbcsr_tas_mp_comm 30 3.6 0.000 0.000 0.019 0.023 2 -16: dbcsr_filter_anytype 96 4.5 0.003 0.003 0.012 0.022 1 -16: dbcsr_add_d 24 1.0 0.000 0.000 0.016 0.021 5 -16: dbcsr_tas_merge_communicate_bu 16 5.5 0.000 0.000 0.013 0.021 8 -16: dbcsr_merge_single_wm 168 5.0 0.012 0.019 0.013 0.020 10 -16: dbcsr_make_index_exist 1644 6.6 0.012 0.020 0.012 0.020 8 -16: multiply_cannon_multrec_finali 72 8.7 0.000 0.000 0.007 0.015 2 -16: dbcsr_mm_multrec_finalize 72 9.7 0.006 0.015 0.007 0.015 7 -16: dbcsr_tas_mm_3N 4 7.0 0.000 0.000 0.006 0.014 0 -16: buffer_matrices_ensure_size 144 6.7 0.002 0.011 0.002 0.011 4 -16: setup_buffer_matrices 144 6.7 0.001 0.001 0.005 0.010 0 -16: dbcsr_iterator_stop 1402 5.4 0.005 0.008 0.005 0.009 9 -16: dbcsr_mm_multrec_init 72 6.7 0.000 0.000 0.006 0.009 2 -16: dbcsr_mm_csr_init 72 7.7 0.006 0.008 0.006 0.008 5 -16: setup_rec_index_2d 144 6.7 0.002 0.008 0.002 0.008 1 -16: merge_index 240 6.1 0.002 0.008 0.002 0.008 7 -16: mp_sum_lv 373 1.0 0.006 0.008 0.006 0.008 11 -16: dbcsr_destroy 1548 4.5 0.003 0.004 0.007 0.007 0 -16: mp_alltoall_d11v 216 2.0 0.006 0.007 0.006 0.007 5 -16: mp_isend_dv 1396 7.2 0.005 0.006 0.005 0.006 3 -16: mp_comm_free 780 5.1 0.004 0.006 0.004 0.006 0 -16: multiply_cannon_metrocomm2 256 4.8 0.002 0.004 0.004 0.005 10 -16: mp_cart_sub 296 8.5 0.005 0.005 0.005 0.005 0 -16: dbcsr_data_release 6112 6.2 0.005 0.005 0.005 0.005 2 -16: dbcsr_data_new 3736 6.0 0.004 0.005 0.004 0.005 2 -16: quick_finalize 96 10.5 0.001 0.003 0.002 0.004 6 -16: mp_max_l 141 1.0 0.003 0.003 0.003 0.003 4 -16: mp_comm_split_direct 78 7.5 0.003 0.003 0.003 0.003 4 -16: dbcsr_make_index_local_row 264 5.0 0.001 0.003 0.001 0.003 6 -16: mp_max_i 515 1.0 0.003 0.003 0.003 0.003 9 -16: multiply_cannon_metrocomm4 232 4.9 0.001 0.001 0.003 0.003 0 -16: dbcsr_work_create 504 5.1 0.002 0.002 0.003 0.003 0 -16: make_images_pack 144 7.7 0.002 0.002 0.002 0.003 6 -16: dbcsr_sort_data 258 6.5 0.002 0.003 0.002 0.003 5 -16: mp_max_r 1 1.0 0.002 0.003 0.002 0.003 2 -16: dbcsr_work_destroy_all 504 6.1 0.001 0.001 0.002 0.002 0 -16: dbcsr_sort_indices 964 7.0 0.002 0.002 0.002 0.002 2 -16: dbcsr_make_index_list 264 5.0 0.001 0.002 0.001 0.002 4 -16: mp_alltoall_i11v 216 2.0 0.002 0.002 0.002 0.002 8 -16: dbcsr_data_copy_aa2 125 5.4 0.001 0.002 0.001 0.002 8 -16: mp_maxloc_dv 301 1.0 0.001 0.002 0.001 0.002 3 -16: tree_to_linear_d 72 4.0 0.001 0.002 0.001 0.002 8 -16: dbcsr_add_wm_from_matrix 18 5.0 0.000 0.001 0.001 0.001 0 -16: dbcsr_distribution_new 518 4.8 0.001 0.001 0.001 0.001 2 -16: mp_isend_lm2 712 7.9 0.001 0.001 0.001 0.001 6 -16: dbcsr_make_untransposed_blocks 72 5.7 0.001 0.001 0.001 0.001 2 -16: dbcsr_init_lib_low 1 1.0 0.001 0.001 0.001 0.001 2 -16: mp_bcast_av 150 1.0 0.001 0.001 0.001 0.001 11 -16: dbcsr_set 72 2.0 0.000 0.000 0.000 0.001 3 -16: dbcsr_iterator_seek 1402 6.3 0.001 0.001 0.001 0.001 2 -16: mp_irecv_dv 1408 7.2 0.001 0.001 0.001 0.001 2 -16: mp_sum_iv 72 6.7 0.001 0.001 0.001 0.001 2 -16: mp_irecv_lm2 710 7.9 0.001 0.001 0.001 0.001 4 -16: mp_isend_iv 911 6.9 0.001 0.001 0.001 0.001 10 -16: dbcsr_zero 72 3.0 0.000 0.001 0.000 0.001 3 -16: dbcsr_tas_reshape_get_coord 120 5.9 0.001 0.001 0.001 0.001 0 -16: mp_bcast_iv 373 1.0 0.001 0.001 0.001 0.001 9 -16: dbcsr_fill_wm_from_matrix 18 6.0 0.000 0.001 0.001 0.001 2 -16: block_buffer_get_index 2016 6.5 0.001 0.001 0.001 0.001 2 -16: dbcsr_switch_data_area 296 8.1 0.000 0.000 0.001 0.001 2 -16: mp_irecv_iv 906 6.9 0.001 0.001 0.001 0.001 0 -16: dbcsr_make_dbcsr_index 844 6.9 0.001 0.001 0.001 0.001 1 -16: dbcsr_tas_blk_sizes 1584 6.5 0.000 0.001 0.000 0.001 2 -16: mp_bcast_i 90 6.7 0.000 0.000 0.000 0.000 7 -16: mp_max_lv 72 3.0 0.000 0.000 0.000 0.000 6 -16: transpose_index_local 56 6.1 0.000 0.000 0.000 0.000 0 -16: fill_hash_tables 72 8.7 0.000 0.000 0.000 0.000 2 -16: mp_max_iv 72 3.0 0.000 0.000 0.000 0.000 1 -16: multrec_filtering 72 10.7 0.000 0.000 0.000 0.000 1 -16: dbcsr_get_data_size_used 240 5.1 0.000 0.000 0.000 0.000 5 -16: dbcsr_index_compact 96 5.5 0.000 0.000 0.000 0.000 2 -16: dbcsr_mm_sched_init 72 8.7 0.000 0.000 0.000 0.000 1 -16: dbcsr_get_local_rows 72 5.7 0.000 0.000 0.000 0.000 5 -16: dbcsr_get_local_cols 72 5.7 0.000 0.000 0.000 0.000 2 -16: mp_dims_create 206 4.6 0.000 0.000 0.000 0.000 11 -16: dbcsr_get_global_row_map 72 5.7 0.000 0.000 0.000 0.000 7 -16: dbcsr_get_global_col_map 72 5.7 0.000 0.000 0.000 0.000 6 -16: dbcsr_mm_sched_finalize 72 10.7 0.000 0.000 0.000 0.000 6 -16: dbcsr_mm_hostdrv_init 72 9.7 0.000 0.000 0.000 0.000 5 -16: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 0 -16: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 4 -16: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 3 +16: dbcsr_tas_multiply 48 2.5 0.000 0.000 7.137 7.166 3 +16: dbcsr_tas_total 48 3.5 0.013 0.021 7.074 7.097 0 +16: dbcsr_tas_result_index 24 3.0 0.017 0.017 2.973 2.979 5 +16: dbcsr_multiply_generic 72 4.7 0.016 0.036 2.784 2.891 3 +16: mp_sync 192 4.6 1.654 1.866 1.654 1.866 6 +16: dbcsr_tas_reshape 120 4.9 0.004 0.004 1.553 1.670 6 +16: dbcsr_tas_dbcsr 48 4.5 0.000 0.000 1.554 1.563 5 +16: mp_alltoall_i 168 6.8 1.282 1.414 1.282 1.414 2 +16: multiply_cannon 72 5.7 0.143 0.290 1.259 1.362 4 +16: dbcsr_create_new 1788 5.7 0.853 1.239 0.897 1.281 4 +16: mp_sum_l 803 4.1 1.043 1.144 1.043 1.144 0 +16: make_m2s 144 5.7 0.004 0.004 1.000 1.040 3 +16: make_images 144 6.7 0.098 0.133 0.989 1.029 3 +16: dbcsr_tas_mm_2 16 5.5 0.000 0.000 1.015 1.025 5 +16: reshape_mm_small 48 4.5 0.010 0.011 0.950 1.000 5 +16: dbcsr_tas_reshape_alltoall 120 5.9 0.001 0.001 0.850 0.991 5 +16: multiply_cannon_loop 72 6.7 0.034 0.062 0.845 0.965 1 +16: dbcsr_complete_redistribute 72 1.0 0.034 0.038 0.897 0.923 2 +16: mp_waitall_1 2496 8.2 0.808 0.902 0.808 0.902 2 +16: reshape_mm_compatible 48 4.5 0.002 0.002 0.678 0.746 0 +16: dbcsr_tas_communicate_buffer 168 6.8 0.012 0.016 0.680 0.737 1 +16: dbcsr_tas_replicate 48 4.5 0.009 0.010 0.691 0.726 0 +16: mp_cart_create 328 6.7 0.653 0.711 0.653 0.711 3 +16: mp_waitall_2 328 7.7 0.658 0.710 0.658 0.710 1 +16: dbcsr_checksum 48 1.0 0.070 0.116 0.571 0.626 4 +16: dbcsr_tas_create_new 246 4.9 0.027 0.028 0.389 0.567 0 +16: mp_sum_d 303 1.2 0.504 0.548 0.504 0.548 2 +16: dbcsr_tas_distribution_new 174 5.3 0.003 0.004 0.495 0.542 3 +16: dbcsr_tas_create_split 78 5.5 0.000 0.000 0.494 0.540 3 +16: dbcsr_tas_create_split_rows_or 78 6.5 0.002 0.002 0.493 0.540 3 +16: multiply_cannon_metrocomm1 264 5.7 0.002 0.002 0.462 0.526 3 +16: dbcsr_tas_reshape_communicate_ 120 5.9 0.001 0.001 0.436 0.507 5 +16: mp_alltoall_i22 72 2.0 0.387 0.504 0.387 0.504 1 +16: mp_comm_dup 78 7.5 0.412 0.486 0.412 0.486 3 +16: make_images_sizes 144 7.7 0.001 0.001 0.370 0.470 3 +16: mp_alltoall_i44 144 8.7 0.369 0.469 0.369 0.469 2 +16: make_images_data 144 7.7 0.006 0.006 0.412 0.447 3 +16: dbcsr_tas_replicate_alltoall 32 5.5 0.000 0.000 0.315 0.365 3 +16: hybrid_alltoall_any 144 8.7 0.041 0.081 0.319 0.359 4 +16: dbcsr_reserve_blocks 288 5.5 0.167 0.274 0.168 0.275 4 +16: dbcsr_tas_merge 16 4.5 0.005 0.006 0.238 0.256 3 +16: mp_allgather_i34 72 6.7 0.213 0.254 0.213 0.254 1 +16: dbcsr_finalize 676 4.0 0.012 0.017 0.175 0.251 6 +16: dbcsr_merge_all 240 5.1 0.140 0.223 0.157 0.236 4 +16: dbcsr_tas_replicate_communicat 32 5.5 0.000 0.000 0.199 0.220 3 +16: reshape_mm_template 24 7.0 0.007 0.011 0.172 0.218 1 +16: dbcsr_add_anytype 72 3.7 0.062 0.095 0.152 0.187 0 +16: mp_max_d 25 1.0 0.163 0.180 0.163 0.180 5 +16: dbcsr_tas_reshape_buffer_obtai 120 5.9 0.015 0.019 0.124 0.180 0 +16: calculate_norms 528 5.7 0.129 0.173 0.129 0.173 4 +16: dbcsr_tas_reserve_blocks_index 168 6.0 0.003 0.006 0.107 0.165 5 +16: dbcsr_tas_setup_test_matrix 6 1.0 0.012 0.021 0.163 0.165 0 +16: mp_alltoall_d11v 216 2.0 0.131 0.164 0.131 0.164 5 +16: multiply_cannon_metrocomm3 264 5.7 0.001 0.001 0.116 0.156 3 +16: dbcsr_tas_merge_alltoall 16 5.5 0.000 0.000 0.117 0.155 6 +16: dbcsr_tas_reshape_buffer_fill 120 5.9 0.012 0.013 0.119 0.154 3 +16: dbcsr_tas_mm_1N 12 5.0 0.000 0.000 0.082 0.154 3 +16: multiply_cannon_multrec 264 5.7 0.057 0.072 0.097 0.149 2 +16: dbcsr_iterator_start 1402 5.3 0.114 0.145 0.116 0.147 4 +16: dbcsr_scale_anytype 88 4.3 0.004 0.007 0.114 0.143 1 +16: dbcsr_special_finalize 336 6.1 0.004 0.004 0.075 0.121 6 +16: dbcsr_new_transposed 56 5.1 0.002 0.002 0.073 0.117 3 +16: dbcsr_tas_mp_comm 30 3.6 0.000 0.000 0.094 0.109 3 +16: dbcsr_copy 240 5.6 0.013 0.036 0.070 0.107 3 +16: mp_comm_split_direct 78 7.5 0.076 0.105 0.076 0.105 1 +16: convert_to_new_pgrid 144 4.5 0.001 0.001 0.069 0.094 3 +16: dbcsr_tas_mm_3T 12 5.0 0.000 0.000 0.063 0.085 5 +16: mp_cart_sub 296 8.5 0.071 0.082 0.071 0.082 0 +16: mp_alltoall_i11v 216 2.0 0.052 0.077 0.052 0.077 3 +16: multiply_cannon_multrec_finali 72 8.7 0.000 0.000 0.040 0.077 3 +16: dbcsr_mm_multrec_finalize 72 9.7 0.039 0.076 0.039 0.076 2 +16: dbcsr_merge_single_wm 224 6.0 0.039 0.064 0.045 0.067 4 +16: dbcsr_tas_convert_to_dbcsr 72 1.0 0.007 0.010 0.056 0.066 0 +16: dbcsr_make_index_exist 1788 6.7 0.040 0.065 0.040 0.065 1 +16: dbcsr_tas_merge_communicate_bu 16 5.5 0.000 0.000 0.046 0.065 3 +16: dbcsr_add_d 24 1.0 0.000 0.000 0.046 0.059 6 +16: quick_finalize 112 9.4 0.023 0.047 0.024 0.049 4 +16: dbcsr_tas_mm_3N 4 7.0 0.000 0.000 0.023 0.044 2 +16: dbcsr_tas_mm_1T 4 7.0 0.000 0.000 0.024 0.036 3 +16: mp_max_iv 72 3.0 0.028 0.032 0.028 0.032 2 +16: mp_max_lv 72 3.0 0.019 0.031 0.019 0.031 6 +16: setup_rec_index_2d 144 6.7 0.012 0.026 0.012 0.026 1 +16: mp_sum_iv 72 6.7 0.013 0.025 0.013 0.025 4 +16: dbcsr_init_lib_low 1 1.0 0.011 0.022 0.011 0.022 0 +16: setup_buffer_matrices 144 6.7 0.002 0.002 0.015 0.021 4 +16: dbcsr_filter_anytype 96 4.5 0.005 0.007 0.016 0.020 0 +16: dbcsr_iterator_stop 1402 5.4 0.012 0.018 0.013 0.019 1 +16: dbcsr_destroy 1692 4.5 0.009 0.009 0.016 0.018 4 +16: dbcsr_mm_multrec_init 72 6.7 0.000 0.000 0.010 0.016 6 +16: dbcsr_mm_csr_init 72 7.7 0.009 0.015 0.010 0.016 2 +16: dbcsr_data_release 6416 6.2 0.012 0.015 0.012 0.015 5 +16: dbcsr_sort_data 314 7.1 0.008 0.014 0.008 0.014 0 +16: mp_comm_free 780 5.1 0.007 0.013 0.007 0.013 5 +16: dbcsr_data_new 3952 6.1 0.011 0.013 0.011 0.013 5 +16: dbcsr_data_copy_aa2 126 5.4 0.005 0.012 0.005 0.012 2 +16: mp_isend_dv 1114 7.4 0.012 0.012 0.012 0.012 3 +16: tree_to_linear_d 72 4.0 0.004 0.012 0.004 0.012 5 +16: mp_sum_lv 244 1.0 0.008 0.010 0.008 0.010 1 +16: mp_max_l 142 1.0 0.007 0.010 0.007 0.010 6 +16: dbcsr_make_index_list 336 5.1 0.006 0.009 0.006 0.009 6 +16: make_images_pack 144 7.7 0.005 0.006 0.007 0.007 6 +16: dbcsr_work_create 576 5.3 0.004 0.004 0.006 0.007 3 +16: dbcsr_work_destroy_all 576 6.3 0.004 0.005 0.005 0.006 1 +16: mp_max_i 387 1.0 0.005 0.006 0.005 0.006 6 +16: multiply_cannon_metrocomm2 144 4.0 0.002 0.002 0.005 0.005 3 +16: buffer_matrices_ensure_size 144 6.7 0.004 0.005 0.004 0.005 5 +16: dbcsr_add_wm_from_matrix 18 5.0 0.001 0.002 0.003 0.005 3 +16: dbcsr_sort_indices 1036 7.1 0.004 0.004 0.004 0.004 1 +16: dbcsr_set 72 2.0 0.000 0.000 0.002 0.004 5 +16: dbcsr_tas_blk_sizes 3064 6.3 0.003 0.004 0.003 0.004 0 +16: dbcsr_zero 72 3.0 0.002 0.004 0.002 0.004 3 +16: merge_index 240 6.1 0.003 0.004 0.003 0.004 0 +16: mp_maxloc_dv 301 1.0 0.003 0.003 0.003 0.003 6 +16: dbcsr_make_untransposed_blocks 72 5.7 0.002 0.002 0.003 0.003 0 +16: dbcsr_fill_wm_from_matrix 18 6.0 0.001 0.003 0.001 0.003 0 +16: multiply_cannon_metrocomm4 48 8.0 0.001 0.001 0.002 0.003 1 +16: dbcsr_iterator_seek 1402 6.3 0.003 0.003 0.003 0.003 1 +16: mp_bcast_av 151 1.0 0.001 0.001 0.002 0.002 3 +16: mp_max_r 1 1.0 0.002 0.002 0.002 0.002 6 +16: dbcsr_distribution_new 518 4.8 0.002 0.002 0.002 0.002 3 +16: dbcsr_tas_reshape_get_coord 120 5.9 0.001 0.001 0.002 0.002 2 +16: mp_irecv_dv 1091 7.4 0.002 0.002 0.002 0.002 3 +16: mp_isend_iv 632 7.4 0.002 0.002 0.002 0.002 3 +16: mp_isend_lm2 774 7.8 0.002 0.002 0.002 0.002 1 +16: block_buffer_get_index 1176 6.5 0.002 0.002 0.002 0.002 3 +16: dbcsr_switch_data_area 312 7.9 0.001 0.001 0.002 0.002 0 +16: dbcsr_make_dbcsr_index 916 7.1 0.001 0.001 0.001 0.001 0 +16: mp_bcast_iv 244 1.0 0.001 0.001 0.001 0.001 6 +16: dbcsr_make_index_local_row 336 5.1 0.001 0.001 0.001 0.001 3 +16: mp_bcast_i 90 6.7 0.001 0.001 0.001 0.001 5 +16: mp_irecv_lm2 731 7.8 0.001 0.001 0.001 0.001 0 +16: mp_irecv_iv 632 7.4 0.001 0.001 0.001 0.001 3 +16: transpose_index_local 56 6.1 0.000 0.001 0.001 0.001 3 +16: multrec_filtering 72 10.7 0.001 0.001 0.001 0.001 2 +16: dbcsr_get_data_size_used 240 5.1 0.001 0.001 0.001 0.001 1 +16: fill_hash_tables 72 8.7 0.000 0.001 0.000 0.001 3 +16: dbcsr_index_compact 96 5.5 0.000 0.000 0.000 0.000 3 +16: dbcsr_mm_sched_init 72 8.7 0.000 0.000 0.000 0.000 5 +16: dbcsr_get_local_rows 72 5.7 0.000 0.000 0.000 0.000 3 +16: mp_sum_i 25 5.3 0.000 0.000 0.000 0.000 0 +16: dbcsr_get_local_cols 72 5.7 0.000 0.000 0.000 0.000 3 +16: mp_dims_create 110 4.6 0.000 0.000 0.000 0.000 3 +16: dbcsr_get_global_row_map 72 5.7 0.000 0.000 0.000 0.000 3 +16: dbcsr_get_global_col_map 72 5.7 0.000 0.000 0.000 0.000 2 +16: dbcsr_mm_sched_finalize 72 10.7 0.000 0.000 0.000 0.000 1 +16: dbcsr_mm_hostdrv_init 72 9.7 0.000 0.000 0.000 0.000 3 +16: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 6 +16: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 6 16: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 6 -16: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 5 -16: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 9 +16: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 0 +16: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 6 16: ------------------------------------------------------------------------------- 16: -16/19 Test #16: dbcsr_tas_unittest .................................... Passed 3.25 sec +16/19 Test #16: dbcsr_tas_unittest .................................... Passed 11.25 sec test 17 Start 17: dbcsr_test_csr_conversions -17: Test command: /usr/bin/mpiexec "-n" "12" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_test_csr_conversions" +17: Test command: /usr/bin/mpiexec "-n" "7" "/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/dbcsr_test_csr_conversions" 17: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 17: Environment variables: 17: OMP_NUM_THREADS=2 @@ -58184,7 +58057,7 @@ 17: ROUTINE CALLS AVE VOLUME [Bytes] 17: MP_Bcast 101 32. 17: MP_Allreduce 419 9. -17: MP_Alltoall 5600 2724. +17: MP_Alltoall 5600 3890. 17: ------------------------------------------------------------------------------- 17: 17: ------------------------------------------------------------------------------- @@ -58194,92 +58067,87 @@ 17: ------------------------------------------------------------------------------- 17: SUBROUTINE CALLS ASD SELF TIME TOTAL TIME MAXRANK 17: MAXIMUM AVERAGE MAXIMUM AVERAGE MAXIMUM -17: dbcsr_complete_redistribute 800 2.5 0.108 0.117 3.276 3.361 6 -17: csr_create_from_dbcsr 200 1.0 0.003 0.003 2.444 2.479 6 -17: mp_alltoall_i22 800 3.5 2.239 2.319 2.239 2.319 9 -17: dbcsr_create_brd 400 2.0 0.005 0.008 1.721 1.754 0 -17: convert_csr_to_dbcsr 200 1.0 0.001 0.001 0.796 0.889 10 -17: convert_dbcsr_to_csr 200 1.0 0.001 0.001 0.793 0.833 7 -17: dbcsr_finalize 1080 3.2 0.016 0.019 0.672 0.813 2 -17: dbcsr_merge_all 1070 4.2 0.628 0.769 0.650 0.791 6 -17: csr_create_from_brd 200 2.0 0.001 0.001 0.704 0.747 11 -17: mp_sum_l 275 2.5 0.692 0.736 0.692 0.736 10 -17: dbcsr_norm_scalar 200 1.0 0.003 0.004 0.604 0.632 11 -17: mp_max_d 201 2.0 0.600 0.628 0.600 0.628 4 -17: dbcsr_create_new 1500 2.3 0.172 0.213 0.186 0.227 11 -17: dbcsr_set 1000 3.0 0.004 0.004 0.136 0.171 11 -17: dbcsr_zero 800 4.5 0.131 0.166 0.131 0.166 8 -17: mp_cart_create 501 3.8 0.046 0.050 0.046 0.050 9 -17: dbcsr_copy 800 1.5 0.015 0.027 0.026 0.046 9 -17: mp_alltoall_d11v 2400 3.5 0.032 0.036 0.032 0.036 8 -17: dbcsr_make_index_exist 1500 3.3 0.013 0.030 0.013 0.030 2 -17: mp_cart_sub 1000 3.8 0.028 0.028 0.028 0.028 9 -17: merge_index 1070 5.2 0.012 0.023 0.012 0.023 2 -17: mp_alltoall_i11v 2400 3.5 0.014 0.021 0.014 0.021 0 -17: dbcsr_add_d 200 1.0 0.000 0.000 0.015 0.016 8 -17: dbcsr_add_anytype 200 2.0 0.003 0.003 0.015 0.016 11 -17: dbcsr_iterator_stop 3080 3.2 0.006 0.012 0.007 0.013 6 -17: convert_brd_to_csr 200 2.0 0.009 0.010 0.011 0.012 4 -17: dbcsr_destroy 1300 1.6 0.004 0.005 0.010 0.011 6 -17: csr_get_dbcsr_mapping 200 3.0 0.009 0.010 0.011 0.011 4 -17: dbcsr_iterator_start 3080 3.2 0.007 0.007 0.009 0.010 11 -17: mp_comm_free 1501 3.1 0.007 0.009 0.007 0.009 0 -17: mp_bcast_iv 101 1.0 0.004 0.007 0.004 0.007 7 -17: dbcsr_data_new 7940 3.6 0.007 0.007 0.007 0.007 0 -17: dbcsr_work_create 1070 3.2 0.004 0.005 0.007 0.007 6 -17: tree_to_linear_d 800 5.5 0.006 0.007 0.006 0.007 6 -17: dbcsr_data_release 11020 3.9 0.006 0.006 0.006 0.006 0 -17: dbcsr_work_destroy_all 1070 4.2 0.003 0.004 0.005 0.005 11 -17: csr_destroy 200 1.0 0.001 0.001 0.004 0.005 0 -17: dbcsr_init_lib_low 1 1.0 0.002 0.004 0.002 0.004 0 -17: convert_csr_to_brd 200 2.0 0.003 0.003 0.003 0.003 6 -17: mp_max_l 52 1.0 0.002 0.003 0.002 0.003 11 -17: dbcsr_sort_indices 1026 5.2 0.002 0.003 0.002 0.003 6 -17: dbcsr_iterator_seek 3080 4.2 0.002 0.002 0.002 0.002 11 -17: dbcsr_data_copy_aa2 474 5.4 0.001 0.001 0.001 0.001 0 -17: dbcsr_get_data_size_used 1070 4.2 0.001 0.001 0.001 0.001 6 -17: dbcsr_distribution_new 500 2.6 0.001 0.001 0.001 0.001 6 -17: mp_maxloc_dv 123 1.0 0.001 0.001 0.001 0.001 8 -17: mp_sum_d 125 1.0 0.001 0.001 0.001 0.001 10 -17: dbcsr_make_dbcsr_index 1070 5.2 0.001 0.001 0.001 0.001 5 -17: csr_assert_consistency_with_db 400 2.0 0.001 0.001 0.001 0.001 11 -17: mp_bcast_av 60 1.0 0.000 0.000 0.000 0.001 1 -17: mp_max_i 54 1.0 0.000 0.000 0.000 0.000 2 -17: csr_create_new 200 3.0 0.000 0.000 0.000 0.000 0 -17: mp_bcast_i 61 2.0 0.000 0.000 0.000 0.000 10 -17: csr_create_nzerow 200 3.0 0.000 0.000 0.000 0.000 6 -17: dbcsr_scale_anytype 200 3.0 0.000 0.000 0.000 0.000 11 -17: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 6 -17: mp_sum_lv 1 1.0 0.000 0.000 0.000 0.000 4 -17: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 6 -17: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 1 +17: dbcsr_complete_redistribute 800 2.5 0.221 0.237 8.165 8.287 4 +17: csr_create_from_dbcsr 200 1.0 0.006 0.006 5.614 5.706 1 +17: mp_alltoall_i22 800 3.5 4.558 4.897 4.558 4.897 4 +17: dbcsr_create_brd 400 2.0 0.009 0.013 4.279 4.332 3 +17: convert_csr_to_dbcsr 200 1.0 0.002 0.002 2.057 2.143 3 +17: convert_dbcsr_to_csr 200 1.0 0.002 0.003 1.896 2.014 1 +17: dbcsr_finalize 1074 3.2 0.028 0.035 1.314 1.735 4 +17: dbcsr_merge_all 1061 4.2 1.239 1.665 1.271 1.695 6 +17: csr_create_from_brd 200 2.0 0.002 0.003 1.298 1.480 1 +17: mp_sum_l 275 2.5 1.276 1.458 1.276 1.458 0 +17: dbcsr_norm_scalar 200 1.0 0.006 0.007 1.189 1.341 2 +17: mp_max_d 201 2.0 1.181 1.332 1.181 1.332 4 +17: mp_cart_create 501 3.8 1.197 1.301 1.197 1.301 5 +17: dbcsr_create_new 1500 2.3 0.301 0.428 0.320 0.443 6 +17: dbcsr_set 1000 3.0 0.008 0.008 0.253 0.333 2 +17: dbcsr_zero 800 4.5 0.243 0.324 0.243 0.324 5 +17: mp_alltoall_d11v 2400 3.5 0.235 0.277 0.235 0.277 2 +17: mp_cart_sub 1000 3.8 0.209 0.253 0.209 0.253 0 +17: mp_alltoall_i11v 2400 3.5 0.175 0.224 0.175 0.224 3 +17: mp_bcast_iv 101 1.0 0.114 0.172 0.114 0.172 6 +17: dbcsr_copy 800 1.5 0.022 0.027 0.042 0.047 3 +17: dbcsr_add_d 200 1.0 0.001 0.001 0.036 0.044 1 +17: dbcsr_add_anytype 200 2.0 0.006 0.006 0.035 0.043 2 +17: dbcsr_make_index_exist 1500 3.3 0.016 0.025 0.016 0.025 1 +17: dbcsr_destroy 1300 1.6 0.011 0.012 0.020 0.024 1 +17: convert_brd_to_csr 200 2.0 0.017 0.018 0.022 0.023 4 +17: dbcsr_iterator_start 3074 3.2 0.016 0.017 0.020 0.022 1 +17: csr_get_dbcsr_mapping 200 3.0 0.016 0.016 0.020 0.021 4 +17: dbcsr_data_new 7922 3.6 0.017 0.018 0.017 0.018 1 +17: dbcsr_data_release 10996 3.9 0.016 0.017 0.016 0.017 5 +17: merge_index 1061 5.2 0.012 0.017 0.012 0.017 5 +17: dbcsr_iterator_stop 3074 3.2 0.012 0.013 0.015 0.016 1 +17: dbcsr_work_create 1061 3.2 0.010 0.010 0.015 0.016 2 +17: tree_to_linear_d 800 5.5 0.011 0.014 0.011 0.014 3 +17: mp_comm_free 1501 3.1 0.009 0.013 0.009 0.013 1 +17: dbcsr_work_destroy_all 1061 4.2 0.008 0.009 0.012 0.013 6 +17: convert_csr_to_brd 200 2.0 0.006 0.007 0.007 0.008 2 +17: csr_destroy 200 1.0 0.002 0.002 0.007 0.007 5 +17: dbcsr_iterator_seek 3074 4.2 0.005 0.005 0.005 0.005 5 +17: dbcsr_sort_indices 1013 5.2 0.004 0.004 0.004 0.004 2 +17: dbcsr_init_lib_low 1 1.0 0.003 0.004 0.003 0.004 5 +17: mp_max_l 52 1.0 0.003 0.004 0.003 0.004 5 +17: dbcsr_data_copy_aa2 477 5.5 0.003 0.004 0.003 0.004 3 +17: dbcsr_get_data_size_used 1061 4.2 0.003 0.003 0.003 0.003 2 +17: dbcsr_distribution_new 500 2.6 0.002 0.002 0.002 0.002 1 +17: dbcsr_make_dbcsr_index 1061 5.2 0.001 0.002 0.001 0.002 5 +17: mp_maxloc_dv 123 1.0 0.001 0.001 0.001 0.001 3 +17: mp_sum_d 125 1.0 0.001 0.001 0.001 0.001 6 +17: csr_assert_consistency_with_db 400 2.0 0.001 0.001 0.001 0.001 0 +17: mp_bcast_av 60 1.0 0.000 0.000 0.001 0.001 2 +17: csr_create_new 200 3.0 0.001 0.001 0.001 0.001 3 +17: mp_max_i 54 1.0 0.000 0.001 0.000 0.001 3 +17: mp_bcast_i 61 2.0 0.000 0.000 0.000 0.000 1 +17: csr_create_nzerow 200 3.0 0.000 0.000 0.000 0.000 1 +17: dbcsr_scale_anytype 200 3.0 0.000 0.000 0.000 0.000 4 +17: mp_max_r 1 1.0 0.000 0.000 0.000 0.000 3 +17: mp_sum_lm3 1 1.0 0.000 0.000 0.000 0.000 3 +17: mp_sum_lv 1 1.0 0.000 0.000 0.000 0.000 0 +17: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 0 +17: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 2 +17: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 3 17: mp_sum_r 1 1.0 0.000 0.000 0.000 0.000 0 -17: mp_min_rv 1 1.0 0.000 0.000 0.000 0.000 9 -17: mp_max_rv 1 1.0 0.000 0.000 0.000 0.000 10 -17: mp_sum_rv 1 1.0 0.000 0.000 0.000 0.000 7 +17: mp_sum_i 1 1.0 0.000 0.000 0.000 0.000 0 17: ------------------------------------------------------------------------------- 17: -17/19 Test #17: dbcsr_test_csr_conversions ............................ Passed 4.95 sec +17/19 Test #17: dbcsr_test_csr_conversions ............................ Passed 11.48 sec test 18 Start 18: dbcsr_test -18: Test command: /usr/bin/mpiexec "-n" "12" "./dbcsr_test" +18: Test command: /usr/bin/mpiexec "-n" "7" "./dbcsr_test" 18: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 18: Environment variables: 18: OMP_NUM_THREADS=2 18: Test timeout computed to be: 1500 -18: I'm processor 0 over 12 proc, (0, 0) in the 2D grid -18: I'm processor 1 over 12 proc, (0, 1) in the 2D grid -18: I'm processor 2 over 12 proc, (0, 2) in the 2D grid -18: I'm processor 3 over 12 proc, (1, 0) in the 2D grid -18: I'm processor 4 over 12 proc, (1, 1) in the 2D grid -18: I'm processor 5 over 12 proc, (1, 2) in the 2D grid -18: I'm processor 6 over 12 proc, (2, 0) in the 2D grid -18: I'm processor 7 over 12 proc, (2, 1) in the 2D grid -18: I'm processor 8 over 12 proc, (2, 2) in the 2D grid -18: I'm processor 9 over 12 proc, (3, 0) in the 2D grid -18: I'm processor 10 over 12 proc, (3, 1) in the 2D grid -18: I'm processor 11 over 12 proc, (3, 2) in the 2D grid +18: I'm processor 0 over 7 proc, (0, 0) in the 2D grid +18: I'm processor 1 over 7 proc, (1, 0) in the 2D grid +18: I'm processor 2 over 7 proc, (2, 0) in the 2D grid +18: I'm processor 3 over 7 proc, (3, 0) in the 2D grid +18: I'm processor 4 over 7 proc, (4, 0) in the 2D grid +18: I'm processor 5 over 7 proc, (5, 0) in the 2D grid +18: I'm processor 6 over 7 proc, (6, 0) in the 2D grid 18: Creating distributions... 18: Creating matrices... 18: Filling matrices... @@ -58291,17 +58159,17 @@ 18: nfullrowstot: 12 18: nfullcolstot: 15 18: nblkrowsloc: 1 -18: nblkcolsloc: 2 +18: nblkcolsloc: 4 18: nfullrowsloc: 2 -18: nfullcolsloc: 8 +18: nfullcolsloc: 15 18: local_rows: 18: 0 18: local_cols: -18: 0 3 +18: 0 1 2 3 0 18: proc_row: 18: 0 1 2 3 18: proc_col: -18: 0 1 2 0 0 +18: 0 0 0 0 0 18: row_blk: 18: 2 3 5 2 18: col_blk: @@ -58310,443 +58178,110 @@ 18: 0 0 0 0 18: col_off: 18: 0 0 0 0 0 -18: Testing distribution_get for dist1 -18: nrows: 4 -18: ncols: 5 -18: mynode: 0 -18: numnodes: 12 -18: nprows: 4 -18: npcols: 3 -18: myprow: 0 -18: mypcol: 0 -18: prow_group: -1006632943 -18: pcol_group: -1006632940 -18: Correct MPI communicator. -18: dist row: -18: 0 1 2 3 -18: dist col: -18: 0 1 2 0 1 -18: grid: -18: 0 1 2 -18: 3 4 5 -18: 6 7 8 -18: 9 10 11 -18: Extracting block diagonal... -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 1, 3) at 1 size 3 3= 9 checksum= 0.252E+01 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 2, 1) at 1 size 3 3= 9 checksum= 0.282E+01 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 3, 1) at 1 size 3 3= 9 checksum= 0.226E+01 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 3, 2) at 1 size 3 3= 9 checksum= 0.184E+01 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 1, 2) at 1 size 3 3= 9 checksum= 0.419E+01 -18: 0.7882 0.7974 0.1058 -18: 0.8262 0.2023 0.5237 -18: 0.6380 0.3293 0.1947 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 2, 1) at 1 size 3 3= 9 checksum= 0.208E+01 -18: 0.0000 0.7974 0.2117 -18: 0.0000 0.2023 1.0473 -18: 0.0000 0.3293 0.3895 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 2, 3) at 1 size 3 3= 9 checksum= 0.292E+01 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 3, 3) at 1 size 3 3= 9 checksum= 0.245E+01 -18: 0.1657 0.5252 0.0269 -18: 0.8539 0.7725 0.4124 -18: 0.3836 0.1889 0.6841 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 3, 3) at 1 size 3 3= 9 checksum= 0.118E+03 -18: 0.9943 3.6764 0.2151 -18: 5.1234 5.4078 3.2994 -18: 2.3016 1.3224 5.4729 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 3, 3) at 1 size 3 3= 9 checksum= 0.118E+03 -18: 0.9943 3.6764 0.2151 -18: 5.1234 5.4078 3.2994 -18: 2.3016 1.3224 5.4729 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: 0.7532 0.7196 0.0833 -18: 0.9770 0.6510 0.9204 -18: 0.1368 0.8606 0.3346 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 1, 2) at 1 size 3 3= 9 checksum= 0.649E+02 -18: 2.2597 2.8784 0.4164 -18: 2.9309 2.6039 4.6022 -18: 0.4103 3.4425 1.6728 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: 0.6832 0.5641 0.0382 -18: 0.2785 0.5482 0.7140 -18: 0.1342 0.9233 0.6142 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 2, 3) at 1 size 3 3= 9 checksum= 0.149E+03 -18: 4.0993 3.9485 0.3054 -18: 1.6711 3.8376 5.7122 -18: 0.8054 6.4628 4.9136 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: 0.2707 0.7585 0.0946 -18: 0.4016 0.4267 0.2221 -18: 0.8874 0.5950 0.2647 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 3, 1) at 1 size 3 3= 9 checksum= 0.162E+01 -18: 0.0000 0.7585 0.1891 -18: 0.0000 0.4267 0.4441 -18: 0.0000 0.5950 0.5293 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 2, 2) at 1 size 3 3= 9 checksum= 0.231E+01 -18: 0.2357 0.6807 0.0720 -18: 0.5524 0.8753 0.6188 -18: 0.3861 0.1263 0.4045 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 2, 2) at 1 size 3 3= 9 checksum= 0.383E+02 -18: 0.7072 2.7229 0.3600 -18: 1.6571 3.5011 3.0942 -18: 1.1584 0.5052 2.0224 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 2, 2) at 1 size 3 3= 9 checksum= 0.383E+02 -18: 0.7072 2.7229 0.3600 -18: 1.6571 3.5011 3.0942 -18: 1.1584 0.5052 2.0224 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 1, 1) at 1 size 3 3= 9 checksum= 0.268E+01 -18: 0.3057 0.8363 0.1171 -18: 0.2508 0.9780 0.8253 -18: 0.3887 0.0637 0.1248 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 1, 1) at 1 size 3 3= 9 checksum= 0.450E+01 -18: 0.0000 0.8363 0.2342 -18: 0.0000 0.9780 1.6505 -18: 0.0000 0.0637 0.2497 -18: Data on rank 0: -18: 0 0 0 0.836257 0.978025 0.063674 0.234232 1.65052 0.249672 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 1, 1) at 1 size 3 3= 9 checksum= 0.450E+01 -18: 0.0000 0.8363 0.2342 -18: 0.0000 0.9780 1.6505 -18: 0.0000 0.0637 0.2497 -18: -18: ------------------------------------------------------------------------------- -18: - - -18: - DBCSR STATISTICS - -18: - - -18: ------------------------------------------------------------------------------- -18: 0.2007 0.6030 0.0494 -18: 0.7031 0.3239 0.0156 -18: 0.8849 0.6576 0.5443 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 1, 3) at 1 size 3 3= 9 checksum= 0.111E+03 -18: 1.2043 4.2207 0.3956 -18: 4.2188 2.2674 0.1251 -18: 5.3092 4.6032 4.3543 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: 0.7182 0.6418 0.0607 -18: 0.1277 0.0996 0.3172 -18: 0.6355 0.3919 0.4744 -18: dbcsr_io:dbcsr_print Contents of matrix named matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111130 -18: dbcsr_io:dbcsr_print 1 blocks 9 nzes, 9 data els -18: 9 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: Checksum for ( 3, 2) at 1 size 3 3= 9 checksum= 0.259E+02 -18: 2.1547 2.5674 0.3036 -18: 0.3832 0.3984 1.5862 -18: 1.9065 1.5678 2.3719 -18: dbcsr_io:dbcsr_print Contents of matrix named diag of matrix d -18: dbcsr_io:dbcsr_print Flags F F F type 3 serial 111131 -18: dbcsr_io:dbcsr_print 0 blocks 0 nzes, 0 data els -18: 0 used -18: dbcsr_io:dbcsr_print Full size 9x 9 -18: dbcsr_io:dbcsr_print Blocked size 3x 3 -18: COUNTER TOTAL BLAS SMM ACC -18: flops 2 x 2 x 2 16 100.0% 0.0% 0.0% -18: flops 2 x 3 x 2 24 100.0% 0.0% 0.0% -18: flops 5 x 2 x 2 40 100.0% 0.0% 0.0% -18: flops 2 x 2 x 3 48 100.0% 0.0% 0.0% -18: flops 3 x 3 x 3 54 100.0% 0.0% 0.0% -18: flops 5 x 2 x 3 60 100.0% 0.0% 0.0% -18: flops 5 x 3 x 2 60 100.0% 0.0% 0.0% -18: flops 3 x 3 x 4 72 100.0% 0.0% 0.0% -18: flops 2 x 5 x 2 80 100.0% 0.0% 0.0% -18: flops 5 x 3 x 3 90 100.0% 0.0% 0.0% -18: flops 2 x 3 x 4 96 100.0% 0.0% 0.0% -18: flops 2 x 3 x 3 144 100.0% 0.0% 0.0% -18: flops 3 x 5 x 3 180 100.0% 0.0% 0.0% -18: flops 5 x 5 x 2 200 100.0% 0.0% 0.0% -18: flops 3 x 5 x 4 240 100.0% 0.0% 0.0% -18: flops 5 x 5 x 3 300 100.0% 0.0% 0.0% -18: flops 2 x 5 x 4 320 100.0% 0.0% 0.0% -18: flops 2 x 5 x 3 480 100.0% 0.0% 0.0% -18: flops inhomo. stacks 1152 100.0% 0.0% 0.0% -18: flops total 3.656000E+03 100.0% 0.0% 0.0% -18: flops max/rank 700.000000E+00 100.0% 0.0% 0.0% -18: matmuls inhomo. stacks 6 100.0% 0.0% 0.0% -18: matmuls total 44 100.0% 0.0% 0.0% -18: number of processed stacks 44 100.0% 0.0% 0.0% -18: average stack size 1.0 0.0 0.0 -18: marketing flops 6.480000E+03 -18: ------------------------------------------------------------------------------- -18: # multiplications 1 -18: max memory usage/rank 101.961728E+06 -18: # max total images/rank 4 -18: # max 3D layers 1 -18: # MPI messages exchanged 204 -18: MPI messages size (bytes): -18: total size 7.632000E+03 -18: min size 0.000000E+00 -18: max size 256.000000E+00 -18: average size 37.411766E+00 -18: MPI breakdown and total messages size (bytes): -18: size <= 128 182 3312 -18: 128 < size <= 8192 22 4320 -18: 8192 < size <= 32768 0 0 -18: 32768 < size <= 131072 0 0 -18: 131072 < size <= 4194304 0 0 -18: 4194304 < size <= 16777216 0 0 -18: 16777216 < size 0 0 -18: ------------------------------------------------------------------------------- -18: -18: *** WARNING in dbcsr_mm.F:291 :: Using a non-square number of MPI ranks *** -18: *** might lead to poor performance. Used ranks: 12 Suggested: 9 25 *** 18: -18: ------------------------------------------------------------------------------- -18: - - -18: - DBCSR MESSAGE PASSING PERFORMANCE - -18: - - -18: ------------------------------------------------------------------------------- -18: ROUTINE CALLS AVE VOLUME [Bytes] -18: MP_Bcast 19 12. -18: MP_Allreduce 60 23. -18: MP_Alltoall 2 672. -18: MP_ISend 38 91. -18: MP_IRecv 40 80. -18: ------------------------------------------------------------------------------- -18/19 Test #18: dbcsr_test ............................................ Passed 0.11 sec +18: =================================================================================== +18: = BAD TERMINATION OF ONE OF YOUR APPLICATION PROCESSES +18: = PID 12151 RUNNING AT i-capture-the-hostname +18: = EXIT CODE: 9 +18: = CLEANING UP REMAINING PROCESSES +18: = YOU CAN IGNORE THE BELOW CLEANUP MESSAGES +18: =================================================================================== +18: YOUR APPLICATION TERMINATED WITH THE EXIT STRING: Segmentation fault (signal 11) +18: This typically refers to a problem with your application. +18: Please see the FAQ page for debugging suggestions +18/19 Test #18: dbcsr_test ............................................***Failed 4.95 sec +I'm processor 0 over 7 proc, (0, 0) in the 2D grid +I'm processor 1 over 7 proc, (1, 0) in the 2D grid +I'm processor 2 over 7 proc, (2, 0) in the 2D grid +I'm processor 3 over 7 proc, (3, 0) in the 2D grid +I'm processor 4 over 7 proc, (4, 0) in the 2D grid +I'm processor 5 over 7 proc, (5, 0) in the 2D grid +I'm processor 6 over 7 proc, (6, 0) in the 2D grid +Creating distributions... +Creating matrices... +Filling matrices... +Multiplying... +Testing get_info for matrix_c +Name: matrix c +nblkrowstot: 4 +nblkcolstot: 4 +nfullrowstot: 12 +nfullcolstot: 15 +nblkrowsloc: 1 +nblkcolsloc: 4 +nfullrowsloc: 2 +nfullcolsloc: 15 +local_rows: +0 +local_cols: +0 1 2 3 0 +proc_row: +0 1 2 3 +proc_col: +0 0 0 0 0 +row_blk: +2 3 5 2 +col_blk: +5 2 5 3 0 +row_off: +0 0 0 0 +col_off: +0 0 0 0 0 + +=================================================================================== += BAD TERMINATION OF ONE OF YOUR APPLICATION PROCESSES += PID 12151 RUNNING AT i-capture-the-hostname += EXIT CODE: 9 += CLEANING UP REMAINING PROCESSES += YOU CAN IGNORE THE BELOW CLEANUP MESSAGES +=================================================================================== +YOUR APPLICATION TERMINATED WITH THE EXIT STRING: Segmentation fault (signal 11) +This typically refers to a problem with your application. +Please see the FAQ page for debugging suggestions + test 19 Start 19: dbcsr_tensor_test -19: Test command: /usr/bin/mpiexec "-n" "12" "./dbcsr_tensor_test" +19: Test command: /usr/bin/mpiexec "-n" "7" "./dbcsr_tensor_test" 19: Working Directory: /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests 19: Environment variables: 19: OMP_NUM_THREADS=2 19: Test timeout computed to be: 1500 19: pgrid3-dimensions: -19: 3 2 2 +19: 7 1 1 19: 19: pgrid4-dimensions: -19: 3 2 2 1 +19: 7 1 1 1 19: 19: dist11: -19: 0 1 2 0 +19: 0 1 2 3 19: 19: dist12: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: 19: dist13: -19: 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 19: 19: dist21: -19: 0 1 2 0 +19: 0 1 2 3 19: 19: dist22: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: 19: dist23: -19: 0 1 0 1 0 +19: 0 0 0 0 0 19: 19: dist24: 19: 0 0 0 19: 19: dist31: -19: 0 1 2 0 1 2 0 1 2 +19: 0 1 2 3 4 5 6 0 1 19: 19: dist32: -19: 0 1 0 1 0 +19: 0 0 0 0 0 19: 19: dist33: -19: 0 1 0 +19: 0 0 0 19: 19: Creating dist objects... 19: @@ -58773,43 +58308,43 @@ 19: GLOBAL INFO OF (13|2) 19: block dimensions: 4 11 9 19: full dimensions: 25 83 74 -19: process grid dimensions: 3 2 2 +19: process grid dimensions: 7 1 1 19: Block sizes: 19: Dim 1: 3 9 12 1 19: Dim 2: 4 2 3 1 9 2 32 10 5 8 7 19: Dim 3: 7 3 8 7 9 5 10 23 2 19: Block distribution: -19: Dim 1: 0 1 2 0 -19: Dim 2: 0 1 0 1 0 1 0 1 0 1 0 -19: Dim 3: 0 1 0 1 0 1 0 1 0 +19: Dim 1: 0 1 2 3 +19: Dim 2: 0 0 0 0 0 0 0 0 0 0 0 +19: Dim 3: 0 0 0 0 0 0 0 0 0 19: DISTRIBUTION OF (13|2) 19: Number of non-zero blocks: 32 19: Percentage of non-zero blocks: 8.08 -19: Average number of blocks per CPU: 3 -19: Maximum number of blocks per CPU: 6 -19: Average number of matrix elements per CPU: 1360 -19: Maximum number of matrix elements per CPU: 3537 +19: Average number of blocks per CPU: 5 +19: Maximum number of blocks per CPU: 11 +19: Average number of matrix elements per CPU: 2330 +19: Maximum number of matrix elements per CPU: 7584 19: GLOBAL INFO OF (54|21) 19: block dimensions: 4 11 5 3 19: full dimensions: 25 83 32 28 -19: process grid dimensions: 3 2 2 1 +19: process grid dimensions: 7 1 1 1 19: Block sizes: 19: Dim 1: 3 9 12 1 19: Dim 2: 4 2 3 1 9 2 32 10 5 8 7 19: Dim 3: 8 1 4 13 6 19: Dim 4: 4 2 22 19: Block distribution: -19: Dim 1: 0 1 2 0 -19: Dim 2: 0 1 0 1 0 1 0 1 0 1 0 -19: Dim 3: 0 1 0 1 0 +19: Dim 1: 0 1 2 3 +19: Dim 2: 0 0 0 0 0 0 0 0 0 0 0 +19: Dim 3: 0 0 0 0 0 19: Dim 4: 0 0 0 19: DISTRIBUTION OF (54|21) 19: Number of non-zero blocks: 36 19: Percentage of non-zero blocks: 5.45 -19: Average number of blocks per CPU: 3 -19: Maximum number of blocks per CPU: 5 -19: Average number of matrix elements per CPU: 12458 -19: Maximum number of matrix elements per CPU: 100620 +19: Average number of blocks per CPU: 6 +19: Maximum number of blocks per CPU: 15 +19: Average number of matrix elements per CPU: 21356 +19: Maximum number of matrix elements per CPU: 130644 19: INDEX INFO 19: tensor index: (bca) x (bcde) = (ade) 19: matrix index: (ba|c) x (ed|cb) = (a|de) @@ -58833,149 +58368,149 @@ 19: GLOBAL INFO OF (13|2) 19: block dimensions: 4 9 11 19: full dimensions: 25 74 83 -19: process grid dimensions: 3 2 2 +19: process grid dimensions: 7 1 1 19: Block sizes: 19: Dim 1: 3 9 12 1 19: Dim 2: 7 3 8 7 9 5 10 23 2 19: Dim 3: 4 2 3 1 9 2 32 10 5 8 7 19: Block distribution: -19: Dim 1: 0 1 2 0 -19: Dim 2: 0 0 0 1 0 1 0 1 1 -19: Dim 3: 0 1 0 1 0 1 0 1 0 1 0 +19: Dim 1: 0 1 2 3 +19: Dim 2: 0 0 0 0 0 0 0 0 0 +19: Dim 3: 0 0 0 0 0 0 0 0 0 0 0 19: DISTRIBUTION OF (13|2) 19: Number of non-zero blocks: 32 19: Percentage of non-zero blocks: 8.08 -19: Average number of blocks per CPU: 3 -19: Maximum number of blocks per CPU: 8 -19: Average number of matrix elements per CPU: 1360 -19: Maximum number of matrix elements per CPU: 4401 +19: Average number of blocks per CPU: 5 +19: Maximum number of blocks per CPU: 11 +19: Average number of matrix elements per CPU: 2330 +19: Maximum number of matrix elements per CPU: 7584 19: -------------------------------------------------------------------------------- 19: DBCSR TAS MATRIX MULTIPLICATION: (13|2) matrix x (54|21) matrix = (3|45) matrix 19: -------------------------------------------------------------------------------- 19: mm dims: 9 44 15 19: MM PARAMETERS -19: Est. number of matrix elements per CPU of result matrix: 879 -19: Est. optimal split factor: 12 +19: Est. number of matrix elements per CPU of result matrix: 1506 +19: Est. optimal split factor: 7 19: No redistribution of (13|2) matrix and (54|21) matrix -19: Change split factor of (13|2) matrix : Yes -19: Change split factor of (54|21) matrix : Yes +19: Change split factor of (13|2) matrix : No +19: Change split factor of (54|21) matrix : No 19: mm case: -- x --T = + 19: SPLIT / PARALLELIZATION INFO -19: splitting columns by factor 6 -19: global grid sizes: 2x 6 -19: grid sizes on subgroups: 2x 1 +19: splitting columns by factor 7 +19: global grid sizes: 1x 7 +19: grid sizes on subgroups: 1x 1 19: GLOBAL INFO OF (13|2) matrix 19: block dimensions: 9 44 19: full dimensions: 74 2075 -19: process grid dimensions: 2 6 +19: process grid dimensions: 1 7 19: Block sizes: 19: Row: 7 3 8 7 9 5 10 23 2 19: Column: 12 6 9 3 27 6 96 30 15 24 21 36 18 27 9 81 18 288 90 45 72 63 48 24 36 12 108 24 384 120 60 96 84 4 2 3 1 9 2 32 10 5 8 7 19: Block distribution: -19: Row: 0 0 0 1 0 1 0 1 1 -19: Column: 0 3 0 3 0 3 0 3 0 3 0 1 4 1 4 1 4 1 4 1 4 1 2 5 2 5 2 5 2 5 2 5 2 0 3 0 3 0 3 0 3 0 3 0 +19: Row: 0 0 0 0 0 0 0 0 0 +19: Column: 0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2 2 2 3 3 3 3 3 3 3 3 3 3 3 19: GLOBAL INFO OF (54|21) matrix 19: block dimensions: 15 44 19: full dimensions: 896 2075 -19: process grid dimensions: 2 6 +19: process grid dimensions: 1 7 19: Block sizes: 19: Row: 32 16 176 4 2 22 16 8 88 52 26 286 24 12 132 19: Column: 12 6 9 3 27 6 96 30 15 24 21 36 18 27 9 81 18 288 90 45 72 63 48 24 36 12 108 24 384 120 60 96 84 4 2 3 1 9 2 32 10 5 8 7 19: Block distribution: -19: Row: 0 0 0 1 1 1 0 0 0 1 1 1 0 0 0 -19: Column: 0 3 0 3 0 3 0 3 0 3 0 1 4 1 4 1 4 1 4 1 4 1 2 5 2 5 2 5 2 5 2 5 2 0 3 0 3 0 3 0 3 0 3 0 +19: Row: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 +19: Column: 0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2 2 2 3 3 3 3 3 3 3 3 3 3 3 19: GLOBAL INFO OF (3|45) matrix 19: block dimensions: 9 15 19: full dimensions: 74 896 -19: process grid dimensions: 2 6 +19: process grid dimensions: 1 7 19: Block sizes: 19: Row: 7 3 8 7 9 5 10 23 2 19: Column: 32 16 176 4 2 22 16 8 88 52 26 286 24 12 132 19: Block distribution: -19: Row: 0 0 0 1 0 1 0 1 1 -19: Column: 1 1 4 1 3 1 3 3 2 3 1 0 3 2 5 +19: Row: 0 0 0 0 0 0 0 0 0 +19: Column: 0 6 1 0 6 0 5 5 3 6 5 2 5 0 4 19: Change process grid: No 19: DISTRIBUTION OF (13|2) matrix 19: Number of non-zero blocks: 32 19: Percentage of non-zero blocks: 8.08 -19: Average number of blocks per group: 6 -19: Maximum number of blocks per group: 9 -19: Average number of matrix elements per group: 2719 -19: Maximum number of matrix elements per group: 4824 -19: Average number of blocks per CPU: 3 -19: Maximum number of blocks per CPU: 8 -19: Average number of matrix elements per CPU: 1360 -19: Maximum number of matrix elements per CPU: 4401 +19: Average number of blocks per group: 5 +19: Maximum number of blocks per group: 11 +19: Average number of matrix elements per group: 2330 +19: Maximum number of matrix elements per group: 7584 +19: Average number of blocks per CPU: 5 +19: Maximum number of blocks per CPU: 11 +19: Average number of matrix elements per CPU: 2330 +19: Maximum number of matrix elements per CPU: 7584 19: DISTRIBUTION OF (54|21) matrix 19: Number of non-zero blocks: 36 19: Percentage of non-zero blocks: 5.45 19: Average number of blocks per group: 6 -19: Maximum number of blocks per group: 8 -19: Average number of matrix elements per group: 24915 -19: Maximum number of matrix elements per group: 125460 -19: Average number of blocks per CPU: 3 -19: Maximum number of blocks per CPU: 5 -19: Average number of matrix elements per CPU: 12458 -19: Maximum number of matrix elements per CPU: 100620 +19: Maximum number of blocks per group: 15 +19: Average number of matrix elements per group: 21356 +19: Maximum number of matrix elements per group: 130644 +19: Average number of blocks per CPU: 6 +19: Maximum number of blocks per CPU: 15 +19: Average number of matrix elements per CPU: 21356 +19: Maximum number of matrix elements per CPU: 130644 19: DISTRIBUTION OF (3|45) matrix replicated 19: Number of non-zero blocks: 23 -19: Percentage of non-zero blocks: 2.84 +19: Percentage of non-zero blocks: 2.43 19: Average number of blocks per group: 4 -19: Maximum number of blocks per group: 7 -19: Average number of matrix elements per group: 1784 -19: Maximum number of matrix elements per group: 7014 -19: Average number of blocks per CPU: 2 -19: Maximum number of blocks per CPU: 7 -19: Average number of matrix elements per CPU: 892 -19: Maximum number of matrix elements per CPU: 7014 +19: Maximum number of blocks per group: 9 +19: Average number of matrix elements per group: 1529 +19: Maximum number of matrix elements per group: 7266 +19: Average number of blocks per CPU: 4 +19: Maximum number of blocks per CPU: 9 +19: Average number of matrix elements per CPU: 1529 +19: Maximum number of matrix elements per CPU: 7266 19: Row distribution on subgroup: -19: 0 0 0 1 0 1 0 1 1 +19: 0 0 0 0 0 0 0 0 0 19: Column distribution on subgroup: 19: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 19: MM PARAMETERS -19: Number of matrix elements per CPU of result matrix: 585 -19: Optimal split factor: 12 +19: Number of matrix elements per CPU of result matrix: 1038 +19: Optimal split factor: 7 19: -------------------------------------------------------------------------------- 19: TAS MATRIX MULTIPLICATION DONE 19: -------------------------------------------------------------------------------- 19: GLOBAL INFO OF (3|45) 19: block dimensions: 9 5 3 19: full dimensions: 74 32 28 -19: process grid dimensions: 3 2 2 +19: process grid dimensions: 7 1 1 19: Block sizes: 19: Dim 1: 7 3 8 7 9 5 10 23 2 19: Dim 2: 8 1 4 13 6 19: Dim 3: 4 2 22 19: Block distribution: -19: Dim 1: 1 0 1 0 1 0 0 2 2 -19: Dim 2: 0 0 1 1 0 -19: Dim 3: 0 0 1 +19: Dim 1: 4 0 3 6 5 0 2 1 6 +19: Dim 2: 0 0 0 0 0 +19: Dim 3: 0 0 0 19: DISTRIBUTION OF (3|45) 19: Number of non-zero blocks: 21 19: Percentage of non-zero blocks: 15.56 -19: Average number of blocks per CPU: 2 -19: Maximum number of blocks per CPU: 4 -19: Average number of matrix elements per CPU: 879 -19: Maximum number of matrix elements per CPU: 3718 +19: Average number of blocks per CPU: 3 +19: Maximum number of blocks per CPU: 5 +19: Average number of matrix elements per CPU: 1506 +19: Maximum number of matrix elements per CPU: 4760 19: GLOBAL INFO OF (3|45) 19: block dimensions: 9 5 3 19: full dimensions: 74 32 28 -19: process grid dimensions: 3 2 2 +19: process grid dimensions: 7 1 1 19: Block sizes: 19: Dim 1: 7 3 8 7 9 5 10 23 2 19: Dim 2: 8 1 4 13 6 19: Dim 3: 4 2 22 19: Block distribution: -19: Dim 1: 0 1 2 0 1 2 0 1 2 -19: Dim 2: 0 1 0 1 0 -19: Dim 3: 0 1 0 +19: Dim 1: 0 1 2 3 4 5 6 0 1 +19: Dim 2: 0 0 0 0 0 +19: Dim 3: 0 0 0 19: DISTRIBUTION OF (3|45) 19: Number of non-zero blocks: 29 19: Percentage of non-zero blocks: 21.48 -19: Average number of blocks per CPU: 3 -19: Maximum number of blocks per CPU: 6 -19: Average number of matrix elements per CPU: 1072 -19: Maximum number of matrix elements per CPU: 4066 +19: Average number of blocks per CPU: 5 +19: Maximum number of blocks per CPU: 7 +19: Average number of matrix elements per CPU: 1838 +19: Maximum number of matrix elements per CPU: 4760 19: -------------------------------------------------------------------------------- 19: TENSOR CONTRACTION DONE 19: -------------------------------------------------------------------------------- @@ -58990,77 +58525,30 @@ 19: 25 83 74 19: 19: Total number of local blocks: -19: 2 6 5 +19: 1 11 9 19: 19: Total number of local elements: -19: 4 60 36 +19: 3 83 74 19: 19: Pgrid dimensions: -19: 3 2 2 +19: 7 1 1 19: 19: Process coordinates: 19: 0 0 0 19: 19: blks_local: -19: 0 3 -19: -19: 0 2 4 6 8 10 -19: -19: 0 2 4 6 8 -19: -19: proc_dist: -19: 0 1 2 0 -19: -19: 0 1 0 1 0 1 0 1 0 1 0 -19: -19: 0 1 0 1 0 1 0 1 0 -19: -19: blk_size: -19: 3 9 12 1 -19: -19: 4 2 3 1 9 2 32 10 5 8 7 -19: -19: 7 3 8 7 9 5 10 23 2 -19: -19: blk_offset: -19: 0 3 12 24 -19: -19: 0 4 6 9 10 19 21 53 63 68 76 -19: -19: 0 7 10 18 25 34 39 49 72 -19: -19: ======= Process: 1 ======== -19: Total number of blocks: -19: 4 11 9 -19: -19: Total number of elements: -19: 25 83 74 -19: -19: Total number of local blocks: -19: 2 5 5 -19: -19: Total number of local elements: -19: 4 23 36 -19: -19: Pgrid dimensions: -19: 3 2 2 -19: -19: Process coordinates: -19: 0 1 0 -19: -19: blks_local: -19: 0 3 +19: 0 19: -19: 1 3 5 7 9 +19: 0 1 2 3 4 5 6 7 8 9 10 19: -19: 0 2 4 6 8 +19: 0 1 2 3 4 5 6 7 8 19: 19: proc_dist: -19: 0 1 2 0 +19: 0 1 2 3 19: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: -19: 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 19: 19: blk_size: 19: 3 9 12 1 @@ -59076,101 +58564,38 @@ 19: 19: 0 7 10 18 25 34 39 49 72 19: -19: ======= Process: 2 ======== -19: Total number of blocks: -19: 4 11 9 -19: -19: Total number of elements: -19: 25 83 74 -19: -19: Total number of local blocks: -19: 2 6 4 -19: -19: Total number of local elements: -19: 4 60 38 -19: -19: Pgrid dimensions: -19: 3 2 2 -19: -19: Process coordinates: -19: 0 0 1 -19: -19: blks_local: -19: 0 3 -19: -19: 0 2 4 6 8 10 -19: -19: 1 3 5 7 -19: -19: proc_dist: -19: 0 1 2 0 -19: -19: 0 1 0 1 0 1 0 1 0 1 0 -19: -19: 0 1 0 1 0 1 0 1 0 -19: -19: blk_size: -19: 3 9 12 1 -19: -19: 4 2 3 1 9 2 32 10 5 8 7 -19: -19: 7 3 8 7 9 5 10 23 2 -19: -19: blk_offset: -19: 0 3 12 24 -19: -19: 0 4 6 9 10 19 21 53 63 68 76 -19: -19: 0 7 10 18 25 34 39 49 72 -19: -19: ======= Process: 3 ======== -19: Total number of blocks: -19: 4 11 9 -19: -19: Total number of elements: -19: 25 83 74 -19: -19: Total number of local blocks: -19: 2 5 4 -19: -19: Total number of local elements: -19: 4 23 38 -19: -19: Pgrid dimensions: -19: 3 2 2 -19: -19: Process coordinates: -19: 0 1 1 -19: -19: blks_local: -19: 0 3 -19: -19: 1 3 5 7 9 -19: -19: 1 3 5 7 +19: Testing get_mapping_info for Tensor 1... +19: ndim_nd = 3 +19: ndim1_2d = 2 +19: ndim2_2d = 1 +19: dims_2d_i8: 36 11 19: -19: proc_dist: -19: 0 1 2 0 +19: dims_2d: 36 11 19: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: dims_nd: +19: 3 10 8 19: -19: 0 1 0 1 0 1 0 1 0 +19: dims1_2d: +19: 3 8 19: -19: blk_size: -19: 3 9 12 1 +19: dims2_2d: +19: 10 19: -19: 4 2 3 1 9 2 32 10 5 8 7 +19: map1_2d: +19: 0 2 19: -19: 7 3 8 7 9 5 10 23 2 +19: map2_2d: +19: 1 19: -19: blk_offset: -19: 0 3 12 24 +19: map_nd: +19: 0 2 1 19: -19: 0 4 6 9 10 19 21 53 63 68 76 +19: Base: 1 +19: col_major 1 19: -19: 0 7 10 18 25 34 39 49 72 +19: Testing c_dbcsr_t_contract_index... 19: -19: ======= Process: 4 ======== +19: ======= Process: 1 ======== 19: Total number of blocks: 19: 4 11 9 19: @@ -59178,13 +58603,13 @@ 19: 25 83 74 19: 19: Total number of local blocks: -19: 1 6 5 +19: 1 11 9 19: 19: Total number of local elements: -19: 9 60 36 +19: 9 83 74 19: 19: Pgrid dimensions: -19: 3 2 2 +19: 7 1 1 19: 19: Process coordinates: 19: 1 0 0 @@ -59192,16 +58617,16 @@ 19: blks_local: 19: 1 19: -19: 0 2 4 6 8 10 +19: 0 1 2 3 4 5 6 7 8 9 10 19: -19: 0 2 4 6 8 +19: 0 1 2 3 4 5 6 7 8 19: 19: proc_dist: -19: 0 1 2 0 +19: 0 1 2 3 19: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: -19: 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 19: 19: blk_size: 19: 3 9 12 1 @@ -59217,7 +58642,7 @@ 19: 19: 0 7 10 18 25 34 39 49 72 19: -19: ======= Process: 5 ======== +19: ======= Process: 2 ======== 19: Total number of blocks: 19: 4 11 9 19: @@ -59225,30 +58650,30 @@ 19: 25 83 74 19: 19: Total number of local blocks: -19: 1 5 5 +19: 1 11 9 19: 19: Total number of local elements: -19: 9 23 36 +19: 12 83 74 19: 19: Pgrid dimensions: -19: 3 2 2 +19: 7 1 1 19: 19: Process coordinates: -19: 1 1 0 +19: 2 0 0 19: 19: blks_local: -19: 1 +19: 2 19: -19: 1 3 5 7 9 +19: 0 1 2 3 4 5 6 7 8 9 10 19: -19: 0 2 4 6 8 +19: 0 1 2 3 4 5 6 7 8 19: 19: proc_dist: -19: 0 1 2 0 +19: 0 1 2 3 19: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: -19: 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 19: 19: blk_size: 19: 3 9 12 1 @@ -59264,7 +58689,7 @@ 19: 19: 0 7 10 18 25 34 39 49 72 19: -19: ======= Process: 6 ======== +19: ======= Process: 3 ======== 19: Total number of blocks: 19: 4 11 9 19: @@ -59272,30 +58697,30 @@ 19: 25 83 74 19: 19: Total number of local blocks: -19: 1 6 4 +19: 1 11 9 19: 19: Total number of local elements: -19: 9 60 38 +19: 1 83 74 19: 19: Pgrid dimensions: -19: 3 2 2 +19: 7 1 1 19: 19: Process coordinates: -19: 1 0 1 +19: 3 0 0 19: 19: blks_local: -19: 1 +19: 3 19: -19: 0 2 4 6 8 10 +19: 0 1 2 3 4 5 6 7 8 9 10 19: -19: 1 3 5 7 +19: 0 1 2 3 4 5 6 7 8 19: 19: proc_dist: -19: 0 1 2 0 +19: 0 1 2 3 19: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: -19: 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 19: 19: blk_size: 19: 3 9 12 1 @@ -59311,7 +58736,7 @@ 19: 19: 0 7 10 18 25 34 39 49 72 19: -19: ======= Process: 7 ======== +19: ======= Process: 4 ======== 19: Total number of blocks: 19: 4 11 9 19: @@ -59319,77 +58744,30 @@ 19: 25 83 74 19: 19: Total number of local blocks: -19: 1 5 4 +19: 0 11 9 19: 19: Total number of local elements: -19: 9 23 38 +19: 0 83 74 19: 19: Pgrid dimensions: -19: 3 2 2 +19: 7 1 1 19: 19: Process coordinates: -19: 1 1 1 +19: 4 0 0 19: 19: blks_local: -19: 1 -19: -19: 1 3 5 7 9 -19: -19: 1 3 5 7 19: -19: proc_dist: -19: 0 1 2 0 -19: -19: 0 1 0 1 0 1 0 1 0 1 0 19: -19: 0 1 0 1 0 1 0 1 0 +19: 0 1 2 3 4 5 6 7 8 9 10 19: -19: blk_size: -19: 3 9 12 1 -19: -19: 4 2 3 1 9 2 32 10 5 8 7 -19: -19: 7 3 8 7 9 5 10 23 2 -19: -19: blk_offset: -19: 0 3 12 24 -19: -19: 0 4 6 9 10 19 21 53 63 68 76 -19: -19: 0 7 10 18 25 34 39 49 72 -19: -19: ======= Process: 8 ======== -19: Total number of blocks: -19: 4 11 9 -19: -19: Total number of elements: -19: 25 83 74 -19: -19: Total number of local blocks: -19: 1 6 5 -19: -19: Total number of local elements: -19: 12 60 36 -19: -19: Pgrid dimensions: -19: 3 2 2 -19: -19: Process coordinates: -19: 2 0 0 -19: -19: blks_local: -19: 2 -19: -19: 0 2 4 6 8 10 -19: -19: 0 2 4 6 8 +19: 0 1 2 3 4 5 6 7 8 19: 19: proc_dist: -19: 0 1 2 0 +19: 0 1 2 3 19: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: -19: 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 19: 19: blk_size: 19: 3 9 12 1 @@ -59405,7 +58783,7 @@ 19: 19: 0 7 10 18 25 34 39 49 72 19: -19: ======= Process: 9 ======== +19: ======= Process: 5 ======== 19: Total number of blocks: 19: 4 11 9 19: @@ -59413,77 +58791,30 @@ 19: 25 83 74 19: 19: Total number of local blocks: -19: 1 5 5 +19: 0 11 9 19: 19: Total number of local elements: -19: 12 23 36 +19: 0 83 74 19: 19: Pgrid dimensions: -19: 3 2 2 +19: 7 1 1 19: 19: Process coordinates: -19: 2 1 0 +19: 5 0 0 19: 19: blks_local: -19: 2 -19: -19: 1 3 5 7 9 -19: -19: 0 2 4 6 8 -19: -19: proc_dist: -19: 0 1 2 0 -19: -19: 0 1 0 1 0 1 0 1 0 1 0 -19: -19: 0 1 0 1 0 1 0 1 0 -19: -19: blk_size: -19: 3 9 12 1 -19: -19: 4 2 3 1 9 2 32 10 5 8 7 -19: -19: 7 3 8 7 9 5 10 23 2 -19: -19: blk_offset: -19: 0 3 12 24 -19: -19: 0 4 6 9 10 19 21 53 63 68 76 -19: -19: 0 7 10 18 25 34 39 49 72 -19: -19: ======= Process: 10 ======== -19: Total number of blocks: -19: 4 11 9 -19: -19: Total number of elements: -19: 25 83 74 -19: -19: Total number of local blocks: -19: 1 6 4 -19: -19: Total number of local elements: -19: 12 60 38 -19: -19: Pgrid dimensions: -19: 3 2 2 -19: -19: Process coordinates: -19: 2 0 1 19: -19: blks_local: -19: 2 19: -19: 0 2 4 6 8 10 +19: 0 1 2 3 4 5 6 7 8 9 10 19: -19: 1 3 5 7 +19: 0 1 2 3 4 5 6 7 8 19: 19: proc_dist: -19: 0 1 2 0 +19: 0 1 2 3 19: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: -19: 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 19: 19: blk_size: 19: 3 9 12 1 @@ -59499,7 +58830,7 @@ 19: 19: 0 7 10 18 25 34 39 49 72 19: -19: ======= Process: 11 ======== +19: ======= Process: 6 ======== 19: Total number of blocks: 19: 4 11 9 19: @@ -59507,30 +58838,30 @@ 19: 25 83 74 19: 19: Total number of local blocks: -19: 1 5 4 +19: 0 11 9 19: 19: Total number of local elements: -19: 12 23 38 +19: 0 83 74 19: 19: Pgrid dimensions: -19: 3 2 2 +19: 7 1 1 19: 19: Process coordinates: -19: 2 1 1 +19: 6 0 0 19: 19: blks_local: -19: 2 19: -19: 1 3 5 7 9 19: -19: 1 3 5 7 +19: 0 1 2 3 4 5 6 7 8 9 10 +19: +19: 0 1 2 3 4 5 6 7 8 19: 19: proc_dist: -19: 0 1 2 0 +19: 0 1 2 3 19: -19: 0 1 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 0 0 19: -19: 0 1 0 1 0 1 0 1 0 +19: 0 0 0 0 0 0 0 0 0 19: 19: blk_size: 19: 3 9 12 1 @@ -59546,314 +58877,62 @@ 19: 19: 0 7 10 18 25 34 39 49 72 19: -19: Testing get_mapping_info for Tensor 1... -19: ndim_nd = 3 -19: ndim1_2d = 2 -19: ndim2_2d = 1 -19: dims_2d_i8: 36 11 -19: -19: dims_2d: 36 11 -19: -19: dims_nd: -19: 3 10 8 -19: -19: dims1_2d: -19: 3 8 -19: -19: dims2_2d: -19: 10 -19: -19: map1_2d: -19: 0 2 -19: -19: map2_2d: -19: 1 -19: -19: map_nd: -19: 0 2 1 -19: -19: Base: 1 -19: col_major 1 -19: -19: Testing c_dbcsr_t_contract_index... -19: 19: Result Indices on Rank 0 19: 1 0 0 +19: 1 3 2 19: 5 0 0 -19: 6 0 0 -19: Result Indices on Rank 1 -19: 3 2 1 19: 5 2 0 19: 5 2 1 -19: 6 3 1 +19: Result Indices on Rank 1 +19: 7 1 0 +19: 7 1 2 +19: 7 2 0 +19: 7 2 1 19: Result Indices on Rank 2 +19: 6 0 0 +19: 6 3 1 +19: 6 3 2 19: 6 4 2 19: Result Indices on Rank 3 -19: 1 3 2 -19: 6 3 2 -19: Result Indices on Rank 4 19: 2 1 0 -19: 4 1 0 -19: Result Indices on Rank 5 -19: 0 3 1 19: 2 3 1 +19: Result Indices on Rank 4 +19: 0 3 1 +19: Result Indices on Rank 5 +19: 4 1 0 19: 4 2 1 19: 4 3 1 -19: Result Indices on Rank 6 -19: Result Indices on Rank 7 19: 4 3 2 -19: Result Indices on Rank 8 -19: 7 1 0 -19: Result Indices on Rank 9 -19: 7 2 0 -19: 7 2 1 -19: Result Indices on Rank 10 -19: 7 1 2 -19: Result Indices on Rank 11 -19/19 Test #19: dbcsr_tensor_test ..................................... Passed 0.21 sec +19: Result Indices on Rank 6 +19: 3 2 1 +19/19 Test #19: dbcsr_tensor_test ..................................... Passed 0.74 sec -100% tests passed, 0 tests failed out of 19 +95% tests passed, 1 tests failed out of 19 -Total Test time (real) = 1348.23 sec +Total Test time (real) = 1946.66 sec + +The following tests FAILED: + 18 - dbcsr_test (Failed) +Errors while running CTest +make[2]: *** [Makefile:74: test] Error 8 make[2]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' +dh_auto_test: error: cd obj-i686-linux-gnu && make -j1 test ARGS\+=--verbose ARGS\+=-j1 returned exit code 2 +make[1]: *** [debian/rules:19: override_dh_auto_test] Error 25 make[1]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0' - create-stamp debian/debhelper-build-stamp - fakeroot debian/rules binary -dh binary --buildsystem=cmake - dh_testroot -O--buildsystem=cmake - dh_prep -O--buildsystem=cmake - dh_auto_install --destdir=debian/libdbcsr-dev/ -O--buildsystem=cmake - cd obj-i686-linux-gnu && make -j22 install DESTDIR=/build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev AM_UPDATE_INFO_DIR=no -make[1]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -/usr/bin/cmake -S/build/reproducible-path/dbcsr-2.6.0 -B/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu --check-build-system CMakeFiles/Makefile.cmake 0 -/usr/bin/cmake -E cmake_progress_start /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/CMakeFiles /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu//CMakeFiles/progress.marks -make -f CMakeFiles/Makefile2 all -make[2]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f src/CMakeFiles/dbcsr.dir/build.make src/CMakeFiles/dbcsr.dir/depend -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/src /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/CMakeFiles/dbcsr.dir/DependInfo.cmake "--color=" -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f src/CMakeFiles/dbcsr.dir/build.make src/CMakeFiles/dbcsr.dir/build -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'src/CMakeFiles/dbcsr.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 81%] Built target dbcsr -make -f src/CMakeFiles/dbcsr_c.dir/build.make src/CMakeFiles/dbcsr_c.dir/depend -make -f tests/CMakeFiles/dbcsr_perf.dir/build.make tests/CMakeFiles/dbcsr_perf.dir/depend -make -f tests/CMakeFiles/dbcsr_unittest_common.dir/build.make tests/CMakeFiles/dbcsr_unittest_common.dir/depend -make -f examples/CMakeFiles/dbcsr_example_1.dir/build.make examples/CMakeFiles/dbcsr_example_1.dir/depend -make -f examples/CMakeFiles/dbcsr_example_2.dir/build.make examples/CMakeFiles/dbcsr_example_2.dir/depend -make -f examples/CMakeFiles/dbcsr_example_3.dir/build.make examples/CMakeFiles/dbcsr_example_3.dir/depend -make -f examples/CMakeFiles/dbcsr_tensor_example_1.dir/build.make examples/CMakeFiles/dbcsr_tensor_example_1.dir/depend -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_perf.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest_common.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_1.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/src /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/src/CMakeFiles/dbcsr_c.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_2.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_1.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_3.dir/DependInfo.cmake "--color=" -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f src/CMakeFiles/dbcsr_c.dir/build.make src/CMakeFiles/dbcsr_c.dir/build -make -f tests/CMakeFiles/dbcsr_unittest_common.dir/build.make tests/CMakeFiles/dbcsr_unittest_common.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f examples/CMakeFiles/dbcsr_example_1.dir/build.make examples/CMakeFiles/dbcsr_example_1.dir/build -make -f tests/CMakeFiles/dbcsr_perf.dir/build.make tests/CMakeFiles/dbcsr_perf.dir/build -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'src/CMakeFiles/dbcsr_c.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f examples/CMakeFiles/dbcsr_example_2.dir/build.make examples/CMakeFiles/dbcsr_example_2.dir/build -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_unittest_common.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'examples/CMakeFiles/dbcsr_example_1.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'examples/CMakeFiles/dbcsr_example_2.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_perf.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f examples/CMakeFiles/dbcsr_example_3.dir/build.make examples/CMakeFiles/dbcsr_example_3.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f examples/CMakeFiles/dbcsr_tensor_example_1.dir/build.make examples/CMakeFiles/dbcsr_tensor_example_1.dir/build -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'examples/CMakeFiles/dbcsr_example_3.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'examples/CMakeFiles/dbcsr_tensor_example_1.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 82%] Built target dbcsr_unittest_common -make -f tests/CMakeFiles/dbcsr_unittest1.dir/build.make tests/CMakeFiles/dbcsr_unittest1.dir/depend -make -f tests/CMakeFiles/dbcsr_unittest2.dir/build.make tests/CMakeFiles/dbcsr_unittest2.dir/depend -make -f tests/CMakeFiles/dbcsr_unittest3.dir/build.make tests/CMakeFiles/dbcsr_unittest3.dir/depend -make -f tests/CMakeFiles/dbcsr_unittest4.dir/build.make tests/CMakeFiles/dbcsr_unittest4.dir/depend -make -f tests/CMakeFiles/dbcsr_tensor_unittest.dir/build.make tests/CMakeFiles/dbcsr_tensor_unittest.dir/depend -[ 85%] Built target dbcsr_c -make -f tests/CMakeFiles/dbcsr_tas_unittest.dir/build.make tests/CMakeFiles/dbcsr_tas_unittest.dir/depend -make -f tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build.make tests/CMakeFiles/dbcsr_test_csr_conversions.dir/depend -make -f tests/CMakeFiles/dbcsr_test.dir/build.make tests/CMakeFiles/dbcsr_test.dir/depend -make -f tests/CMakeFiles/dbcsr_tensor_test.dir/build.make tests/CMakeFiles/dbcsr_tensor_test.dir/depend -[ 86%] Built target dbcsr_perf -make -f examples/CMakeFiles/dbcsr_example_3_cpp.dir/build.make examples/CMakeFiles/dbcsr_example_3_cpp.dir/depend -make -f examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/build.make examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/depend -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest1.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest2.dir/DependInfo.cmake "--color=" -[ 88%] Built target dbcsr_example_1 -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest3.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_unittest4.dir/DependInfo.cmake "--color=" -[ 88%] Built target dbcsr_example_2 -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tas_unittest.dir/DependInfo.cmake "--color=" -[ 89%] Built target dbcsr_example_3 -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tensor_unittest.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test_csr_conversions.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_test.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/tests/CMakeFiles/dbcsr_tensor_test.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_example_3_cpp.dir/DependInfo.cmake "--color=" -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -cd /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /build/reproducible-path/dbcsr-2.6.0 /build/reproducible-path/dbcsr-2.6.0/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/DependInfo.cmake "--color=" -[ 89%] Built target dbcsr_tensor_example_1 -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_unittest2.dir/build.make tests/CMakeFiles/dbcsr_unittest2.dir/build -make -f tests/CMakeFiles/dbcsr_unittest1.dir/build.make tests/CMakeFiles/dbcsr_unittest1.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_unittest3.dir/build.make tests/CMakeFiles/dbcsr_unittest3.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_tas_unittest.dir/build.make tests/CMakeFiles/dbcsr_tas_unittest.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_tensor_unittest.dir/build.make tests/CMakeFiles/dbcsr_tensor_unittest.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_tensor_test.dir/build.make tests/CMakeFiles/dbcsr_tensor_test.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_unittest4.dir/build.make tests/CMakeFiles/dbcsr_unittest4.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_test.dir/build.make tests/CMakeFiles/dbcsr_test.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f examples/CMakeFiles/dbcsr_example_3_cpp.dir/build.make examples/CMakeFiles/dbcsr_example_3_cpp.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build.make tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make -f examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/build.make examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/build -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_unittest2.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_unittest3.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_tensor_unittest.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_unittest1.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_tas_unittest.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_test_csr_conversions.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_unittest4.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 89%] Built target dbcsr_tensor_unittest -[ 89%] Built target dbcsr_unittest2 -[ 91%] Built target dbcsr_unittest3 -[ 92%] Built target dbcsr_tas_unittest -[ 92%] Built target dbcsr_test_csr_conversions -[ 94%] Built target dbcsr_unittest1 -[ 95%] Built target dbcsr_unittest4 -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_tensor_test.dir/build'. -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'examples/CMakeFiles/dbcsr_example_3_cpp.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'examples/CMakeFiles/dbcsr_tensor_example_2_cpp.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[3]: Nothing to be done for 'tests/CMakeFiles/dbcsr_test.dir/build'. -make[3]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -[ 98%] Built target dbcsr_tensor_test -[ 98%] Built target dbcsr_test -[ 98%] Built target dbcsr_example_3_cpp -[100%] Built target dbcsr_tensor_example_2_cpp -make[2]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -/usr/bin/cmake -E cmake_progress_start /build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu/CMakeFiles 0 -make -f CMakeFiles/Makefile2 preinstall -make[2]: Entering directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -make[2]: Nothing to be done for 'preinstall'. -make[2]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' -Install the project... -/usr/bin/cmake -P cmake_install.cmake --- Install configuration: "None" --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/lib/i386-linux-gnu/libdbcsr.a --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/include/dbcsr_api.mod --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/include/dbcsr_tensor_api.mod --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/include/dbcsr_config.mod --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/lib/i386-linux-gnu/libdbcsr_c.a --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/include/dbcsr.h --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/include/dbcsr_tensor.h --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/lib/i386-linux-gnu/cmake/dbcsr/DBCSRTargets.cmake --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/lib/i386-linux-gnu/cmake/dbcsr/DBCSRTargets-none.cmake --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/lib/i386-linux-gnu/cmake/dbcsr/DBCSRConfig.cmake --- Installing: /build/reproducible-path/dbcsr-2.6.0/debian/libdbcsr-dev/usr/lib/i386-linux-gnu/cmake/dbcsr/DBCSRConfigVersion.cmake -make[1]: Leaving directory '/build/reproducible-path/dbcsr-2.6.0/obj-i686-linux-gnu' - dh_installdocs -O--buildsystem=cmake - dh_installchangelogs -O--buildsystem=cmake - dh_systemd_enable -O--buildsystem=cmake - dh_installinit -O--buildsystem=cmake - dh_systemd_start -O--buildsystem=cmake - dh_perl -O--buildsystem=cmake - dh_link -O--buildsystem=cmake - dh_strip_nondeterminism -O--buildsystem=cmake - dh_compress -O--buildsystem=cmake - dh_fixperms -O--buildsystem=cmake - dh_missing -O--buildsystem=cmake - dh_strip -O--buildsystem=cmake - dh_makeshlibs -O--buildsystem=cmake - dh_shlibdeps -O--buildsystem=cmake - dh_installdeb -O--buildsystem=cmake - dh_gencontrol -O--buildsystem=cmake -dpkg-gencontrol: warning: Depends field of package libdbcsr-dev: substitution variable ${shlibs:Depends} used, but is not defined - dh_md5sums -O--buildsystem=cmake - dh_builddeb -O--buildsystem=cmake -dpkg-deb: building package 'libdbcsr-dev' in '../libdbcsr-dev_2.6.0-2_i386.deb'. - dpkg-genbuildinfo --build=binary -O../dbcsr_2.6.0-2_i386.buildinfo - dpkg-genchanges --build=binary -O../dbcsr_2.6.0-2_i386.changes -dpkg-genchanges: info: binary-only upload (no source code included) - dpkg-source --after-build . -dpkg-buildpackage: info: binary-only upload (no source included) -dpkg-genchanges: info: not including original source code in upload +make: *** [debian/rules:10: build] Error 2 +dpkg-buildpackage: error: debian/rules build subprocess returned exit status 2 I: copying local configuration +E: Failed autobuilding of package +I: user script /srv/workspace/pbuilder/6634/tmp/hooks/C01_cleanup starting +debug output: disk usage on i-capture-the-hostname at Fri Nov 22 14:22:57 UTC 2024 +Filesystem Size Used Avail Use% Mounted on +tmpfs 3.9G 0 3.9G 0% /dev/shm + +I: user script /srv/workspace/pbuilder/6634/tmp/hooks/C01_cleanup finished I: unmounting dev/ptmx filesystem I: unmounting dev/pts filesystem I: unmounting dev/shm filesystem I: unmounting proc filesystem I: unmounting sys filesystem I: cleaning the build env -I: removing directory /srv/workspace/pbuilder/87525 and its subdirectories -I: Current time: Thu Dec 25 08:12:02 -12 2025 -I: pbuilder-time-stamp: 1766693522 +I: removing directory /srv/workspace/pbuilder/6634 and its subdirectories