Diff of the two buildlogs: -- --- b1/build.log 2023-05-16 01:42:38.008405734 +0000 +++ b2/build.log 2023-05-16 01:57:39.916933075 +0000 @@ -1,6 +1,6 @@ I: pbuilder: network access will be disabled during build -I: Current time: Mon May 15 13:34:21 -12 2023 -I: pbuilder-time-stamp: 1684200861 +I: Current time: Tue May 16 15:42:59 +14 2023 +I: pbuilder-time-stamp: 1684201379 I: Building the build Environment I: extracting base tarball [/var/cache/pbuilder/bookworm-reproducible-base.tgz] I: copying local configuration @@ -16,7 +16,7 @@ I: copying [./fenicsx-performance-tests_0.5.0~git20220731.821823b.orig.tar.gz] I: copying [./fenicsx-performance-tests_0.5.0~git20220731.821823b-1.debian.tar.xz] I: Extracting source -gpgv: Signature made Thu Sep 22 00:05:12 2022 -12 +gpgv: Signature made Fri Sep 23 02:05:12 2022 +14 gpgv: using RSA key 23C9A93E585819E9126D0A36573EF1E4BD5A01FA gpgv: Can't check signature: No public key dpkg-source: warning: cannot verify inline signature for ./fenicsx-performance-tests_0.5.0~git20220731.821823b-1.dsc: no acceptable signature found @@ -27,135 +27,167 @@ dpkg-source: info: applying enable_complex_build.patch I: Not using root during the build. I: Installing the build-deps -I: user script /srv/workspace/pbuilder/1361/tmp/hooks/D02_print_environment starting +I: user script /srv/workspace/pbuilder/27026/tmp/hooks/D01_modify_environment starting +debug: Running on virt32c. +I: Changing host+domainname to test build reproducibility +I: Adding a custom variable just for the fun of it... +I: Changing /bin/sh to bash +'/bin/sh' -> '/bin/bash' +lrwxrwxrwx 1 root root 9 May 16 15:44 /bin/sh -> /bin/bash +I: Setting pbuilder2's login shell to /bin/bash +I: Setting pbuilder2's GECOS to second user,second room,second work-phone,second home-phone,second other +I: user script /srv/workspace/pbuilder/27026/tmp/hooks/D01_modify_environment finished +I: user script /srv/workspace/pbuilder/27026/tmp/hooks/D02_print_environment starting I: set - BUILDDIR='/build' - BUILDUSERGECOS='first user,first room,first work-phone,first home-phone,first other' - BUILDUSERNAME='pbuilder1' - BUILD_ARCH='armhf' - DEBIAN_FRONTEND='noninteractive' - DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=3 ' - DISTRIBUTION='bookworm' - HOME='/root' - HOST_ARCH='armhf' + BASH=/bin/sh + BASHOPTS=checkwinsize:cmdhist:complete_fullquote:extquote:force_fignore:globasciiranges:globskipdots:hostcomplete:interactive_comments:patsub_replacement:progcomp:promptvars:sourcepath + BASH_ALIASES=() + BASH_ARGC=() + BASH_ARGV=() + BASH_CMDS=() + BASH_LINENO=([0]="12" [1]="0") + BASH_LOADABLES_PATH=/usr/local/lib/bash:/usr/lib/bash:/opt/local/lib/bash:/usr/pkg/lib/bash:/opt/pkg/lib/bash:. + BASH_SOURCE=([0]="/tmp/hooks/D02_print_environment" [1]="/tmp/hooks/D02_print_environment") + BASH_VERSINFO=([0]="5" [1]="2" [2]="15" [3]="1" [4]="release" [5]="arm-unknown-linux-gnueabihf") + BASH_VERSION='5.2.15(1)-release' + BUILDDIR=/build + BUILDUSERGECOS='second user,second room,second work-phone,second home-phone,second other' + BUILDUSERNAME=pbuilder2 + BUILD_ARCH=armhf + DEBIAN_FRONTEND=noninteractive + DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=4 ' + DIRSTACK=() + DISTRIBUTION=bookworm + EUID=0 + FUNCNAME=([0]="Echo" [1]="main") + GROUPS=() + HOME=/root + HOSTNAME=i-capture-the-hostname + HOSTTYPE=arm + HOST_ARCH=armhf IFS=' ' - INVOCATION_ID='441a3a87a28b46ebb8ae815b7d5b4581' - LANG='C' - LANGUAGE='en_US:en' - LC_ALL='C' - MAIL='/var/mail/root' - OPTIND='1' - PATH='/usr/sbin:/usr/bin:/sbin:/bin:/usr/games' - PBCURRENTCOMMANDLINEOPERATION='build' - PBUILDER_OPERATION='build' - PBUILDER_PKGDATADIR='/usr/share/pbuilder' - PBUILDER_PKGLIBDIR='/usr/lib/pbuilder' - PBUILDER_SYSCONFDIR='/etc' - PPID='1361' - PS1='# ' - PS2='> ' + INVOCATION_ID=dff376bd81554a83b89a81357db9ed71 + LANG=C + LANGUAGE=it_CH:it + LC_ALL=C + MACHTYPE=arm-unknown-linux-gnueabihf + MAIL=/var/mail/root + OPTERR=1 + OPTIND=1 + OSTYPE=linux-gnueabihf + PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path + PBCURRENTCOMMANDLINEOPERATION=build + PBUILDER_OPERATION=build + PBUILDER_PKGDATADIR=/usr/share/pbuilder + PBUILDER_PKGLIBDIR=/usr/lib/pbuilder + PBUILDER_SYSCONFDIR=/etc + PIPESTATUS=([0]="0") + POSIXLY_CORRECT=y + PPID=27026 PS4='+ ' - PWD='/' - SHELL='/bin/bash' - SHLVL='2' - SUDO_COMMAND='/usr/bin/timeout -k 18.1h 18h /usr/bin/ionice -c 3 /usr/bin/nice /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.hm1oJCHB/pbuilderrc_v8cX --distribution bookworm --hookdir /etc/pbuilder/first-build-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/bookworm-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.hm1oJCHB/b1 --logfile b1/build.log fenicsx-performance-tests_0.5.0~git20220731.821823b-1.dsc' - SUDO_GID='113' - SUDO_UID='107' - SUDO_USER='jenkins' - TERM='unknown' - TZ='/usr/share/zoneinfo/Etc/GMT+12' - USER='root' - _='/usr/bin/systemd-run' - http_proxy='http://10.0.0.15:3142/' + PWD=/ + SHELL=/bin/bash + SHELLOPTS=braceexpand:errexit:hashall:interactive-comments:posix + SHLVL=3 + SUDO_COMMAND='/usr/bin/timeout -k 24.1h 24h /usr/bin/ionice -c 3 /usr/bin/nice -n 11 /usr/bin/unshare --uts -- /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.hm1oJCHB/pbuilderrc_PK6M --distribution bookworm --hookdir /etc/pbuilder/rebuild-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/bookworm-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.hm1oJCHB/b2 --logfile b2/build.log --extrapackages usrmerge fenicsx-performance-tests_0.5.0~git20220731.821823b-1.dsc' + SUDO_GID=113 + SUDO_UID=107 + SUDO_USER=jenkins + TERM=unknown + TZ=/usr/share/zoneinfo/Etc/GMT-14 + UID=0 + USER=root + _='I: set' + http_proxy=http://10.0.0.15:3142/ I: uname -a - Linux virt64c 5.10.0-23-arm64 #1 SMP Debian 5.10.179-1 (2023-05-12) aarch64 GNU/Linux + Linux i-capture-the-hostname 5.10.0-23-armmp-lpae #1 SMP Debian 5.10.179-1 (2023-05-12) armv7l GNU/Linux I: ls -l /bin total 5072 - -rwxr-xr-x 1 root root 838488 Apr 23 09:24 bash - -rwxr-xr-x 3 root root 67144 Sep 18 2022 bunzip2 - -rwxr-xr-x 3 root root 67144 Sep 18 2022 bzcat - lrwxrwxrwx 1 root root 6 Sep 18 2022 bzcmp -> bzdiff - -rwxr-xr-x 1 root root 2225 Sep 18 2022 bzdiff - lrwxrwxrwx 1 root root 6 Sep 18 2022 bzegrep -> bzgrep - -rwxr-xr-x 1 root root 4893 Nov 27 2021 bzexe - lrwxrwxrwx 1 root root 6 Sep 18 2022 bzfgrep -> bzgrep - -rwxr-xr-x 1 root root 3775 Sep 18 2022 bzgrep - -rwxr-xr-x 3 root root 67144 Sep 18 2022 bzip2 - -rwxr-xr-x 1 root root 67112 Sep 18 2022 bzip2recover - lrwxrwxrwx 1 root root 6 Sep 18 2022 bzless -> bzmore - -rwxr-xr-x 1 root root 1297 Sep 18 2022 bzmore - -rwxr-xr-x 1 root root 67632 Sep 20 2022 cat - -rwxr-xr-x 1 root root 67676 Sep 20 2022 chgrp - -rwxr-xr-x 1 root root 67644 Sep 20 2022 chmod - -rwxr-xr-x 1 root root 67684 Sep 20 2022 chown - -rwxr-xr-x 1 root root 133532 Sep 20 2022 cp - -rwxr-xr-x 1 root root 132868 Jan 5 01:20 dash - -rwxr-xr-x 1 root root 133220 Sep 20 2022 date - -rwxr-xr-x 1 root root 67732 Sep 20 2022 dd - -rwxr-xr-x 1 root root 68104 Sep 20 2022 df - -rwxr-xr-x 1 root root 133632 Sep 20 2022 dir - -rwxr-xr-x 1 root root 59128 Mar 22 21:02 dmesg - lrwxrwxrwx 1 root root 8 Dec 19 01:33 dnsdomainname -> hostname - lrwxrwxrwx 1 root root 8 Dec 19 01:33 domainname -> hostname - -rwxr-xr-x 1 root root 67560 Sep 20 2022 echo - -rwxr-xr-x 1 root root 41 Jan 24 02:43 egrep - -rwxr-xr-x 1 root root 67548 Sep 20 2022 false - -rwxr-xr-x 1 root root 41 Jan 24 02:43 fgrep - -rwxr-xr-x 1 root root 55748 Mar 22 21:02 findmnt - -rwsr-xr-x 1 root root 26208 Mar 22 20:15 fusermount - -rwxr-xr-x 1 root root 128608 Jan 24 02:43 grep - -rwxr-xr-x 2 root root 2346 Apr 9 2022 gunzip - -rwxr-xr-x 1 root root 6447 Apr 9 2022 gzexe - -rwxr-xr-x 1 root root 64220 Apr 9 2022 gzip - -rwxr-xr-x 1 root root 67032 Dec 19 01:33 hostname - -rwxr-xr-x 1 root root 67720 Sep 20 2022 ln - -rwxr-xr-x 1 root root 35132 Mar 22 21:51 login - -rwxr-xr-x 1 root root 133632 Sep 20 2022 ls - -rwxr-xr-x 1 root root 136808 Mar 22 21:02 lsblk - -rwxr-xr-x 1 root root 67800 Sep 20 2022 mkdir - -rwxr-xr-x 1 root root 67764 Sep 20 2022 mknod - -rwxr-xr-x 1 root root 67596 Sep 20 2022 mktemp - -rwxr-xr-x 1 root root 38504 Mar 22 21:02 more - -rwsr-xr-x 1 root root 38496 Mar 22 21:02 mount - -rwxr-xr-x 1 root root 9824 Mar 22 21:02 mountpoint - -rwxr-xr-x 1 root root 133532 Sep 20 2022 mv - lrwxrwxrwx 1 root root 8 Dec 19 01:33 nisdomainname -> hostname - lrwxrwxrwx 1 root root 14 Apr 2 18:25 pidof -> /sbin/killall5 - -rwxr-xr-x 1 root root 67608 Sep 20 2022 pwd - lrwxrwxrwx 1 root root 4 Apr 23 09:24 rbash -> bash - -rwxr-xr-x 1 root root 67600 Sep 20 2022 readlink - -rwxr-xr-x 1 root root 67672 Sep 20 2022 rm - -rwxr-xr-x 1 root root 67600 Sep 20 2022 rmdir - -rwxr-xr-x 1 root root 67400 Nov 2 2022 run-parts - -rwxr-xr-x 1 root root 133372 Jan 5 07:55 sed - lrwxrwxrwx 1 root root 4 Jan 5 01:20 sh -> dash - -rwxr-xr-x 1 root root 67584 Sep 20 2022 sleep - -rwxr-xr-x 1 root root 67644 Sep 20 2022 stty - -rwsr-xr-x 1 root root 50800 Mar 22 21:02 su - -rwxr-xr-x 1 root root 67584 Sep 20 2022 sync - -rwxr-xr-x 1 root root 336764 Apr 6 02:25 tar - -rwxr-xr-x 1 root root 67144 Nov 2 2022 tempfile - -rwxr-xr-x 1 root root 133224 Sep 20 2022 touch - -rwxr-xr-x 1 root root 67548 Sep 20 2022 true - -rwxr-xr-x 1 root root 9768 Mar 22 20:15 ulockmgr_server - -rwsr-xr-x 1 root root 22108 Mar 22 21:02 umount - -rwxr-xr-x 1 root root 67572 Sep 20 2022 uname - -rwxr-xr-x 2 root root 2346 Apr 9 2022 uncompress - -rwxr-xr-x 1 root root 133632 Sep 20 2022 vdir - -rwxr-xr-x 1 root root 42608 Mar 22 21:02 wdctl - lrwxrwxrwx 1 root root 8 Dec 19 01:33 ypdomainname -> hostname - -rwxr-xr-x 1 root root 1984 Apr 9 2022 zcat - -rwxr-xr-x 1 root root 1678 Apr 9 2022 zcmp - -rwxr-xr-x 1 root root 6460 Apr 9 2022 zdiff - -rwxr-xr-x 1 root root 29 Apr 9 2022 zegrep - -rwxr-xr-x 1 root root 29 Apr 9 2022 zfgrep - -rwxr-xr-x 1 root root 2081 Apr 9 2022 zforce - -rwxr-xr-x 1 root root 8103 Apr 9 2022 zgrep - -rwxr-xr-x 1 root root 2206 Apr 9 2022 zless - -rwxr-xr-x 1 root root 1842 Apr 9 2022 zmore - -rwxr-xr-x 1 root root 4577 Apr 9 2022 znew -I: user script /srv/workspace/pbuilder/1361/tmp/hooks/D02_print_environment finished + -rwxr-xr-x 1 root root 838488 Apr 24 11:24 bash + -rwxr-xr-x 3 root root 67144 Sep 19 2022 bunzip2 + -rwxr-xr-x 3 root root 67144 Sep 19 2022 bzcat + lrwxrwxrwx 1 root root 6 Sep 19 2022 bzcmp -> bzdiff + -rwxr-xr-x 1 root root 2225 Sep 19 2022 bzdiff + lrwxrwxrwx 1 root root 6 Sep 19 2022 bzegrep -> bzgrep + -rwxr-xr-x 1 root root 4893 Nov 28 2021 bzexe + lrwxrwxrwx 1 root root 6 Sep 19 2022 bzfgrep -> bzgrep + -rwxr-xr-x 1 root root 3775 Sep 19 2022 bzgrep + -rwxr-xr-x 3 root root 67144 Sep 19 2022 bzip2 + -rwxr-xr-x 1 root root 67112 Sep 19 2022 bzip2recover + lrwxrwxrwx 1 root root 6 Sep 19 2022 bzless -> bzmore + -rwxr-xr-x 1 root root 1297 Sep 19 2022 bzmore + -rwxr-xr-x 1 root root 67632 Sep 21 2022 cat + -rwxr-xr-x 1 root root 67676 Sep 21 2022 chgrp + -rwxr-xr-x 1 root root 67644 Sep 21 2022 chmod + -rwxr-xr-x 1 root root 67684 Sep 21 2022 chown + -rwxr-xr-x 1 root root 133532 Sep 21 2022 cp + -rwxr-xr-x 1 root root 132868 Jan 6 03:20 dash + -rwxr-xr-x 1 root root 133220 Sep 21 2022 date + -rwxr-xr-x 1 root root 67732 Sep 21 2022 dd + -rwxr-xr-x 1 root root 68104 Sep 21 2022 df + -rwxr-xr-x 1 root root 133632 Sep 21 2022 dir + -rwxr-xr-x 1 root root 59128 Mar 23 23:02 dmesg + lrwxrwxrwx 1 root root 8 Dec 20 03:33 dnsdomainname -> hostname + lrwxrwxrwx 1 root root 8 Dec 20 03:33 domainname -> hostname + -rwxr-xr-x 1 root root 67560 Sep 21 2022 echo + -rwxr-xr-x 1 root root 41 Jan 25 04:43 egrep + -rwxr-xr-x 1 root root 67548 Sep 21 2022 false + -rwxr-xr-x 1 root root 41 Jan 25 04:43 fgrep + -rwxr-xr-x 1 root root 55748 Mar 23 23:02 findmnt + -rwsr-xr-x 1 root root 26208 Mar 23 22:15 fusermount + -rwxr-xr-x 1 root root 128608 Jan 25 04:43 grep + -rwxr-xr-x 2 root root 2346 Apr 10 2022 gunzip + -rwxr-xr-x 1 root root 6447 Apr 10 2022 gzexe + -rwxr-xr-x 1 root root 64220 Apr 10 2022 gzip + -rwxr-xr-x 1 root root 67032 Dec 20 03:33 hostname + -rwxr-xr-x 1 root root 67720 Sep 21 2022 ln + -rwxr-xr-x 1 root root 35132 Mar 23 23:51 login + -rwxr-xr-x 1 root root 133632 Sep 21 2022 ls + -rwxr-xr-x 1 root root 136808 Mar 23 23:02 lsblk + -rwxr-xr-x 1 root root 67800 Sep 21 2022 mkdir + -rwxr-xr-x 1 root root 67764 Sep 21 2022 mknod + -rwxr-xr-x 1 root root 67596 Sep 21 2022 mktemp + -rwxr-xr-x 1 root root 38504 Mar 23 23:02 more + -rwsr-xr-x 1 root root 38496 Mar 23 23:02 mount + -rwxr-xr-x 1 root root 9824 Mar 23 23:02 mountpoint + -rwxr-xr-x 1 root root 133532 Sep 21 2022 mv + lrwxrwxrwx 1 root root 8 Dec 20 03:33 nisdomainname -> hostname + lrwxrwxrwx 1 root root 14 Apr 3 20:25 pidof -> /sbin/killall5 + -rwxr-xr-x 1 root root 67608 Sep 21 2022 pwd + lrwxrwxrwx 1 root root 4 Apr 24 11:24 rbash -> bash + -rwxr-xr-x 1 root root 67600 Sep 21 2022 readlink + -rwxr-xr-x 1 root root 67672 Sep 21 2022 rm + -rwxr-xr-x 1 root root 67600 Sep 21 2022 rmdir + -rwxr-xr-x 1 root root 67400 Nov 3 2022 run-parts + -rwxr-xr-x 1 root root 133372 Jan 6 09:55 sed + lrwxrwxrwx 1 root root 9 May 16 15:44 sh -> /bin/bash + -rwxr-xr-x 1 root root 67584 Sep 21 2022 sleep + -rwxr-xr-x 1 root root 67644 Sep 21 2022 stty + -rwsr-xr-x 1 root root 50800 Mar 23 23:02 su + -rwxr-xr-x 1 root root 67584 Sep 21 2022 sync + -rwxr-xr-x 1 root root 336764 Apr 7 04:25 tar + -rwxr-xr-x 1 root root 67144 Nov 3 2022 tempfile + -rwxr-xr-x 1 root root 133224 Sep 21 2022 touch + -rwxr-xr-x 1 root root 67548 Sep 21 2022 true + -rwxr-xr-x 1 root root 9768 Mar 23 22:15 ulockmgr_server + -rwsr-xr-x 1 root root 22108 Mar 23 23:02 umount + -rwxr-xr-x 1 root root 67572 Sep 21 2022 uname + -rwxr-xr-x 2 root root 2346 Apr 10 2022 uncompress + -rwxr-xr-x 1 root root 133632 Sep 21 2022 vdir + -rwxr-xr-x 1 root root 42608 Mar 23 23:02 wdctl + lrwxrwxrwx 1 root root 8 Dec 20 03:33 ypdomainname -> hostname + -rwxr-xr-x 1 root root 1984 Apr 10 2022 zcat + -rwxr-xr-x 1 root root 1678 Apr 10 2022 zcmp + -rwxr-xr-x 1 root root 6460 Apr 10 2022 zdiff + -rwxr-xr-x 1 root root 29 Apr 10 2022 zegrep + -rwxr-xr-x 1 root root 29 Apr 10 2022 zfgrep + -rwxr-xr-x 1 root root 2081 Apr 10 2022 zforce + -rwxr-xr-x 1 root root 8103 Apr 10 2022 zgrep + -rwxr-xr-x 1 root root 2206 Apr 10 2022 zless + -rwxr-xr-x 1 root root 1842 Apr 10 2022 zmore + -rwxr-xr-x 1 root root 4577 Apr 10 2022 znew +I: user script /srv/workspace/pbuilder/27026/tmp/hooks/D02_print_environment finished -> Attempting to satisfy build-dependencies -> Creating pbuilder-satisfydepends-dummy package Package: pbuilder-satisfydepends-dummy @@ -474,7 +506,7 @@ Get: 269 http://deb.debian.org/debian bookworm/main armhf libxtensor-dev armhf 0.24.3-1 [189 kB] Get: 270 http://deb.debian.org/debian bookworm/main armhf libdolfinx-dev armhf 1:0.5.2-2+b1 [155 kB] Get: 271 http://deb.debian.org/debian bookworm/main armhf xtensor-dev all 0.24.3-1 [5372 B] -Fetched 163 MB in 6s (27.9 MB/s) +Fetched 163 MB in 16s (10.4 MB/s) debconf: delaying package configuration, since apt-utils is not installed Selecting previously unselected package libpython3.11-minimal:armhf. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 19329 files and directories currently installed.) @@ -1597,8 +1629,19 @@ Writing extended state information... Building tag database... -> Finished parsing the build-deps +Reading package lists... +Building dependency tree... +Reading state information... +usrmerge is already the newest version (35). +0 upgraded, 0 newly installed, 0 to remove and 0 not upgraded. I: Building the package -I: Running cd /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-genchanges -S > ../fenicsx-performance-tests_0.5.0~git20220731.821823b-1_source.changes +I: user script /srv/workspace/pbuilder/27026/tmp/hooks/A99_set_merged_usr starting +Re-configuring usrmerge... +removed '/etc/unsupported-skip-usrmerge-conversion' +The system has been successfully converted. +I: user script /srv/workspace/pbuilder/27026/tmp/hooks/A99_set_merged_usr finished +hostname: Name or service not known +I: Running cd /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-genchanges -S > ../fenicsx-performance-tests_0.5.0~git20220731.821823b-1_source.changes dpkg-buildpackage: info: source package fenicsx-performance-tests dpkg-buildpackage: info: source version 0.5.0~git20220731.821823b-1 dpkg-buildpackage: info: source distribution unstable @@ -1694,7 +1737,7 @@ -- Build files have been written to: /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf make[1]: Leaving directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b' dh_auto_build -O--buildsystem=cmake -O--sourcedirectory=src - cd obj-arm-linux-gnueabihf && make -j3 "INSTALL=install --strip-program=true" VERBOSE=1 + cd obj-arm-linux-gnueabihf && make -j4 "INSTALL=install --strip-program=true" VERBOSE=1 make[1]: Entering directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf' /usr/bin/cmake -S"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -B"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" --check-build-system CMakeFiles/Makefile.cmake 0 /usr/bin/cmake -E cmake_progress_start "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/CMakeFiles" "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf//CMakeFiles/progress.marks" @@ -1702,20 +1745,22 @@ make[2]: Entering directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf' make -f CMakeFiles/dolfinx-scaling-test.dir/build.make CMakeFiles/dolfinx-scaling-test.dir/depend make[3]: Entering directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf' -[ 10%] Generating Poisson.c -ffcx /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/Poisson.py -[ 20%] Generating Elasticity.c +[ 10%] Generating Elasticity.c ffcx /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/Elasticity.py +[ 20%] Generating Poisson.c +ffcx /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/Poisson.py cd "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" && /usr/bin/cmake -E cmake_depends "Unix Makefiles" "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/CMakeFiles/dolfinx-scaling-test.dir/DependInfo.cmake" --color= make[3]: Leaving directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf' make -f CMakeFiles/dolfinx-scaling-test.dir/build.make CMakeFiles/dolfinx-scaling-test.dir/build make[3]: Entering directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf' -[ 30%] Building CXX object CMakeFiles/dolfinx-scaling-test.dir/mesh.cpp.o -/usr/bin/c++ -DBOOST_ALL_NO_LIB -DBOOST_CHRONO_DYN_LINK -DBOOST_PROGRAM_OPTIONS_DYN_LINK -DBOOST_TIMER_DYN_LINK -DDOLFINX_VERSION=\"0.5.2\" -DHAS_PTSCOTCH -DHAS_SLEPC -D_FILE_OFFSET_BITS=64 -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -isystem /usr/lib/python3/dist-packages/ffcx/codegeneration -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include/openmpi -isystem /usr/lib/petscdir/petsc3.18/arm-linux-gnueabihf-real/include -isystem /usr/include/hdf5/openmpi -isystem /usr/lib/slepcdir/slepc3.18/arm-linux-gnueabihf-real/include -g -O2 -ffile-prefix-map=/build/fenicsx-performance-tests-0.5.0~git20220731.821823b=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -O3 -DNDEBUG -Wdate-time -D_FORTIFY_SOURCE=2 -std=c++20 -MD -MT CMakeFiles/dolfinx-scaling-test.dir/mesh.cpp.o -MF CMakeFiles/dolfinx-scaling-test.dir/mesh.cpp.o.d -o CMakeFiles/dolfinx-scaling-test.dir/mesh.cpp.o -c "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/mesh.cpp" -[ 40%] Building CXX object CMakeFiles/dolfinx-scaling-test.dir/main.cpp.o +[ 30%] Building CXX object CMakeFiles/dolfinx-scaling-test.dir/main.cpp.o /usr/bin/c++ -DBOOST_ALL_NO_LIB -DBOOST_CHRONO_DYN_LINK -DBOOST_PROGRAM_OPTIONS_DYN_LINK -DBOOST_TIMER_DYN_LINK -DDOLFINX_VERSION=\"0.5.2\" -DHAS_PTSCOTCH -DHAS_SLEPC -D_FILE_OFFSET_BITS=64 -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -isystem /usr/lib/python3/dist-packages/ffcx/codegeneration -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include/openmpi -isystem /usr/lib/petscdir/petsc3.18/arm-linux-gnueabihf-real/include -isystem /usr/include/hdf5/openmpi -isystem /usr/lib/slepcdir/slepc3.18/arm-linux-gnueabihf-real/include -g -O2 -ffile-prefix-map=/build/fenicsx-performance-tests-0.5.0~git20220731.821823b=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -O3 -DNDEBUG -Wdate-time -D_FORTIFY_SOURCE=2 -std=c++20 -MD -MT CMakeFiles/dolfinx-scaling-test.dir/main.cpp.o -MF CMakeFiles/dolfinx-scaling-test.dir/main.cpp.o.d -o CMakeFiles/dolfinx-scaling-test.dir/main.cpp.o -c "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/main.cpp" +[ 40%] Building CXX object CMakeFiles/dolfinx-scaling-test.dir/mesh.cpp.o +/usr/bin/c++ -DBOOST_ALL_NO_LIB -DBOOST_CHRONO_DYN_LINK -DBOOST_PROGRAM_OPTIONS_DYN_LINK -DBOOST_TIMER_DYN_LINK -DDOLFINX_VERSION=\"0.5.2\" -DHAS_PTSCOTCH -DHAS_SLEPC -D_FILE_OFFSET_BITS=64 -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -isystem /usr/lib/python3/dist-packages/ffcx/codegeneration -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include/openmpi -isystem /usr/lib/petscdir/petsc3.18/arm-linux-gnueabihf-real/include -isystem /usr/include/hdf5/openmpi -isystem /usr/lib/slepcdir/slepc3.18/arm-linux-gnueabihf-real/include -g -O2 -ffile-prefix-map=/build/fenicsx-performance-tests-0.5.0~git20220731.821823b=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -O3 -DNDEBUG -Wdate-time -D_FORTIFY_SOURCE=2 -std=c++20 -MD -MT CMakeFiles/dolfinx-scaling-test.dir/mesh.cpp.o -MF CMakeFiles/dolfinx-scaling-test.dir/mesh.cpp.o.d -o CMakeFiles/dolfinx-scaling-test.dir/mesh.cpp.o -c "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/mesh.cpp" [ 50%] Building CXX object CMakeFiles/dolfinx-scaling-test.dir/elasticity_problem.cpp.o /usr/bin/c++ -DBOOST_ALL_NO_LIB -DBOOST_CHRONO_DYN_LINK -DBOOST_PROGRAM_OPTIONS_DYN_LINK -DBOOST_TIMER_DYN_LINK -DDOLFINX_VERSION=\"0.5.2\" -DHAS_PTSCOTCH -DHAS_SLEPC -D_FILE_OFFSET_BITS=64 -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -isystem /usr/lib/python3/dist-packages/ffcx/codegeneration -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include/openmpi -isystem /usr/lib/petscdir/petsc3.18/arm-linux-gnueabihf-real/include -isystem /usr/include/hdf5/openmpi -isystem /usr/lib/slepcdir/slepc3.18/arm-linux-gnueabihf-real/include -g -O2 -ffile-prefix-map=/build/fenicsx-performance-tests-0.5.0~git20220731.821823b=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -O3 -DNDEBUG -Wdate-time -D_FORTIFY_SOURCE=2 -std=c++20 -MD -MT CMakeFiles/dolfinx-scaling-test.dir/elasticity_problem.cpp.o -MF CMakeFiles/dolfinx-scaling-test.dir/elasticity_problem.cpp.o.d -o CMakeFiles/dolfinx-scaling-test.dir/elasticity_problem.cpp.o -c "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/elasticity_problem.cpp" +[ 60%] Building CXX object CMakeFiles/dolfinx-scaling-test.dir/poisson_problem.cpp.o +/usr/bin/c++ -DBOOST_ALL_NO_LIB -DBOOST_CHRONO_DYN_LINK -DBOOST_PROGRAM_OPTIONS_DYN_LINK -DBOOST_TIMER_DYN_LINK -DDOLFINX_VERSION=\"0.5.2\" -DHAS_PTSCOTCH -DHAS_SLEPC -D_FILE_OFFSET_BITS=64 -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -isystem /usr/lib/python3/dist-packages/ffcx/codegeneration -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include/openmpi -isystem /usr/lib/petscdir/petsc3.18/arm-linux-gnueabihf-real/include -isystem /usr/include/hdf5/openmpi -isystem /usr/lib/slepcdir/slepc3.18/arm-linux-gnueabihf-real/include -g -O2 -ffile-prefix-map=/build/fenicsx-performance-tests-0.5.0~git20220731.821823b=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -O3 -DNDEBUG -Wdate-time -D_FORTIFY_SOURCE=2 -std=c++20 -MD -MT CMakeFiles/dolfinx-scaling-test.dir/poisson_problem.cpp.o -MF CMakeFiles/dolfinx-scaling-test.dir/poisson_problem.cpp.o.d -o CMakeFiles/dolfinx-scaling-test.dir/poisson_problem.cpp.o -c "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/poisson_problem.cpp" /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/mesh.cpp: In function 'std::shared_ptr create_spoke_mesh(MPI_Comm, std::size_t, bool, std::size_t)': /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/mesh.cpp:342:79: note: parameter passing for argument of type 'std::span' changed in GCC 7.1 342 | auto mesh = std::make_shared(dolfinx::mesh::create_mesh( @@ -1728,8 +1773,6 @@ | ~~~~~~~~~~~~~~~~~~~~ 346 | element, x, {x.size() / 3, 3}, dolfinx::mesh::GhostMode::none)); | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -[ 60%] Building CXX object CMakeFiles/dolfinx-scaling-test.dir/poisson_problem.cpp.o -/usr/bin/c++ -DBOOST_ALL_NO_LIB -DBOOST_CHRONO_DYN_LINK -DBOOST_PROGRAM_OPTIONS_DYN_LINK -DBOOST_TIMER_DYN_LINK -DDOLFINX_VERSION=\"0.5.2\" -DHAS_PTSCOTCH -DHAS_SLEPC -D_FILE_OFFSET_BITS=64 -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -isystem /usr/lib/python3/dist-packages/ffcx/codegeneration -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include/openmpi -isystem /usr/lib/petscdir/petsc3.18/arm-linux-gnueabihf-real/include -isystem /usr/include/hdf5/openmpi -isystem /usr/lib/slepcdir/slepc3.18/arm-linux-gnueabihf-real/include -g -O2 -ffile-prefix-map=/build/fenicsx-performance-tests-0.5.0~git20220731.821823b=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -O3 -DNDEBUG -Wdate-time -D_FORTIFY_SOURCE=2 -std=c++20 -MD -MT CMakeFiles/dolfinx-scaling-test.dir/poisson_problem.cpp.o -MF CMakeFiles/dolfinx-scaling-test.dir/poisson_problem.cpp.o.d -o CMakeFiles/dolfinx-scaling-test.dir/poisson_problem.cpp.o -c "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/poisson_problem.cpp" [ 70%] Building CXX object CMakeFiles/dolfinx-scaling-test.dir/mem.cpp.o /usr/bin/c++ -DBOOST_ALL_NO_LIB -DBOOST_CHRONO_DYN_LINK -DBOOST_PROGRAM_OPTIONS_DYN_LINK -DBOOST_TIMER_DYN_LINK -DDOLFINX_VERSION=\"0.5.2\" -DHAS_PTSCOTCH -DHAS_SLEPC -D_FILE_OFFSET_BITS=64 -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" -I"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -isystem /usr/lib/python3/dist-packages/ffcx/codegeneration -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include -isystem /usr/lib/arm-linux-gnueabihf/openmpi/include/openmpi -isystem /usr/lib/petscdir/petsc3.18/arm-linux-gnueabihf-real/include -isystem /usr/include/hdf5/openmpi -isystem /usr/lib/slepcdir/slepc3.18/arm-linux-gnueabihf-real/include -g -O2 -ffile-prefix-map=/build/fenicsx-performance-tests-0.5.0~git20220731.821823b=. -fstack-protector-strong -Wformat -Werror=format-security -Wdate-time -D_FORTIFY_SOURCE=2 -O3 -DNDEBUG -Wdate-time -D_FORTIFY_SOURCE=2 -std=c++20 -MD -MT CMakeFiles/dolfinx-scaling-test.dir/mem.cpp.o -MF CMakeFiles/dolfinx-scaling-test.dir/mem.cpp.o.d -o CMakeFiles/dolfinx-scaling-test.dir/mem.cpp.o -c "/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/mem.cpp" [ 80%] Building C object CMakeFiles/dolfinx-scaling-test.dir/Elasticity.c.o @@ -1739,8 +1782,8 @@ In file included from /usr/include/dolfinx/fem/CoordinateElement.h:15, from /usr/include/dolfinx/fem/interpolate.h:10, from /usr/include/dolfinx/fem/Function.h:12, - from /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/elasticity_problem.h:9, - from /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/elasticity_problem.cpp:7: + from /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/poisson_problem.h:9, + from /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/poisson_problem.cpp:7: /usr/include/dolfinx/common/math.h: In function 'auto dolfinx::math::det(Matrix) [with Matrix = std::experimental::mdspan >]': /usr/include/dolfinx/common/math.h:85:6: note: parameter passing for argument of type 'std::experimental::mdspan >' changed in GCC 7.1 85 | auto det(Matrix A) @@ -1761,6 +1804,20 @@ /usr/include/dolfinx/common/math.h:239:23: note: parameter passing for argument of type 'std::experimental::mdspan, std::experimental::layout_right, std::experimental::default_accessor >' changed in GCC 7.1 239 | dolfinx::math::inv(ATA, Inv); | ~~~~~~~~~~~~~~~~~~^~~~~~~~~~ +In file included from /usr/include/dolfinx/fem/CoordinateElement.h:15, + from /usr/include/dolfinx/fem/interpolate.h:10, + from /usr/include/dolfinx/fem/Function.h:12, + from /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/elasticity_problem.h:9, + from /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/elasticity_problem.cpp:7: +/usr/include/dolfinx/common/math.h: In function 'auto dolfinx::math::det(Matrix) [with Matrix = std::experimental::mdspan >]': +/usr/include/dolfinx/common/math.h:85:6: note: parameter passing for argument of type 'std::experimental::mdspan >' changed in GCC 7.1 + 85 | auto det(Matrix A) + | ^~~ +/usr/include/dolfinx/common/math.h: In function 'void dolfinx::math::inv(U, V) [with U = std::experimental::mdspan >; V = std::experimental::mdspan >]': +/usr/include/dolfinx/common/math.h:123:6: note: parameter passing for argument of type 'std::experimental::mdspan >' changed in GCC 7.1 + 123 | void inv(U A, V B) + | ^~~ +/usr/include/dolfinx/common/math.h:123:6: note: parameter passing for argument of type 'std::experimental::mdspan >' changed in GCC 7.1 /usr/include/dolfinx/fem/interpolate.h: In function 'void dolfinx::fem::interpolate(Function&, std::span, std::array, std::span) [with T = double]': /usr/include/dolfinx/fem/interpolate.h:421:6: note: parameter passing for argument of type 'std::span' changed in GCC 7.1 421 | void interpolate(Function& u, std::span f, @@ -1781,26 +1838,6 @@ 116 | math::pinv(J, K); | ~~~~~~~~~~^~~~~~ /usr/include/dolfinx/fem/CoordinateElement.h:116:17: note: parameter passing for argument of type 'std::experimental::mdspan >' changed in GCC 7.1 -/usr/include/dolfinx/fem/Function.h: In member function 'void dolfinx::fem::Function::interpolate(const std::function >, xt::layout_type::row_major, xt::svector >::size_type, 4, std::allocator::size_type>, true>, xt::xtensor_expression_tag>(const xt::xtensor_container >, 2, xt::layout_type::row_major, xt::xtensor_expression_tag>&)>&, std::span) [with T = double]': -/usr/include/dolfinx/fem/Function.h:216:21: note: parameter passing for argument of type 'std::span' changed in GCC 7.1 - 216 | fem::interpolate(*this, std::span(fx.data(), fx.size()), fshape, - | ~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - 217 | cells); - | ~~~~~~ -In file included from /usr/include/dolfinx/fem/CoordinateElement.h:15, - from /usr/include/dolfinx/fem/interpolate.h:10, - from /usr/include/dolfinx/fem/Function.h:12, - from /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/poisson_problem.h:9, - from /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src/poisson_problem.cpp:7: -/usr/include/dolfinx/common/math.h: In function 'auto dolfinx::math::det(Matrix) [with Matrix = std::experimental::mdspan >]': -/usr/include/dolfinx/common/math.h:85:6: note: parameter passing for argument of type 'std::experimental::mdspan >' changed in GCC 7.1 - 85 | auto det(Matrix A) - | ^~~ -/usr/include/dolfinx/common/math.h: In function 'void dolfinx::math::inv(U, V) [with U = std::experimental::mdspan >; V = std::experimental::mdspan >]': -/usr/include/dolfinx/common/math.h:123:6: note: parameter passing for argument of type 'std::experimental::mdspan >' changed in GCC 7.1 - 123 | void inv(U A, V B) - | ^~~ -/usr/include/dolfinx/common/math.h:123:6: note: parameter passing for argument of type 'std::experimental::mdspan >' changed in GCC 7.1 /usr/include/dolfinx/common/math.h: In function 'void dolfinx::math::inv(U, V) [with U = std::experimental::mdspan, std::experimental::layout_right, std::experimental::default_accessor >; V = std::experimental::mdspan, std::experimental::layout_right, std::experimental::default_accessor >]': /usr/include/dolfinx/common/math.h:123:6: note: parameter passing for argument of type 'std::experimental::mdspan, std::experimental::layout_right, std::experimental::default_accessor >' changed in GCC 7.1 /usr/include/dolfinx/common/math.h:123:6: note: parameter passing for argument of type 'std::experimental::mdspan, std::experimental::layout_right, std::experimental::default_accessor >' changed in GCC 7.1 @@ -1812,6 +1849,12 @@ /usr/include/dolfinx/common/math.h:239:23: note: parameter passing for argument of type 'std::experimental::mdspan, std::experimental::layout_right, std::experimental::default_accessor >' changed in GCC 7.1 239 | dolfinx::math::inv(ATA, Inv); | ~~~~~~~~~~~~~~~~~~^~~~~~~~~~ +/usr/include/dolfinx/fem/Function.h: In member function 'void dolfinx::fem::Function::interpolate(const std::function >, xt::layout_type::row_major, xt::svector >::size_type, 4, std::allocator::size_type>, true>, xt::xtensor_expression_tag>(const xt::xtensor_container >, 2, xt::layout_type::row_major, xt::xtensor_expression_tag>&)>&, std::span) [with T = double]': +/usr/include/dolfinx/fem/Function.h:216:21: note: parameter passing for argument of type 'std::span' changed in GCC 7.1 + 216 | fem::interpolate(*this, std::span(fx.data(), fx.size()), fshape, + | ~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + 217 | cells); + | ~~~~~~ /usr/include/dolfinx/fem/interpolate.h: In function 'void dolfinx::fem::interpolate(Function&, std::span, std::array, std::span) [with T = double]': /usr/include/dolfinx/fem/interpolate.h:421:6: note: parameter passing for argument of type 'std::span' changed in GCC 7.1 421 | void interpolate(Function& u, std::span f, @@ -1850,61 +1893,61 @@ make[1]: Entering directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b' debian/tests/run-dolfinx-scaling-test -p /build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf ==== elasticity weak scaling (3 processes with ndofs=10000) ==== -2023-05-15 13:41:00.181 ( 0.183s) [RANK: 0 ] utils.cpp:612 INFO| Compute partition of cells across ranks -2023-05-15 13:41:00.181 ( 0.183s) [RANK: 0 ] graphbuild.cpp:533 INFO| Building mesh dual graph -2023-05-15 13:41:00.181 ( 0.183s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph -2023-05-15 13:41:00.228 ( 0.230s) [RANK: 0 ] graphbuild.cpp:89 INFO| Build nonlocal part of mesh dual graph -2023-05-15 13:41:00.273 ( 0.275s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:00.273 ( 0.275s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:00.273 ( 0.275s) [RANK: 0 ] graphbuild.cpp:203 INFO| Number of destination and source ranks in non-local dual graph construction, and ratio to total number of ranks: 2, 2, 0.666667, 0.666667 -2023-05-15 13:41:00.283 ( 0.285s) [RANK: 0 ] graphbuild.cpp:545 INFO| Graph edges (local: 66332, non-local: 962) -2023-05-15 13:41:00.283 ( 0.285s) [RANK: 0 ] partitioners.cpp:316 INFO| Compute graph partition using PT-SCOTCH -2023-05-15 13:41:10.661 ( 10.663s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 -2023-05-15 13:41:10.662 ( 10.664s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 -2023-05-15 13:41:10.666 ( 10.668s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph -2023-05-15 13:41:10.715 ( 10.716s) [RANK: 0 ] ordering.cpp:202 INFO| GPS pseudo-diameter:(121) 645-16278 - -2023-05-15 13:41:10.721 ( 10.723s) [RANK: 0 ] Topology.cpp:923 INFO| Create topology -2023-05-15 13:41:10.726 ( 10.728s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 -2023-05-15 13:41:10.726 ( 10.728s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 -2023-05-15 13:41:10.743 ( 10.745s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.744 ( 10.746s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.745 ( 10.746s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.745 ( 10.747s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.749 ( 10.751s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.749 ( 10.751s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.749 ( 10.751s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:10.749 ( 10.751s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:10.750 ( 10.752s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.750 ( 10.752s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.755 ( 10.757s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:10.755 ( 10.757s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:10.755 ( 10.757s) [RANK: 0 ] MPI.h:368 INFO| Number of neighbourhood source ranks in distribute_to_postoffice: 0 -2023-05-15 13:41:10.756 ( 10.758s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.756 ( 10.758s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.756 ( 10.758s) [RANK: 0 ] MPI.h:500 INFO| Neighbourhood destination ranks from post office in distribute_data (rank, num dests, num dests/mpi_size): 0, 2, 0.666667 +2023-05-16 15:54:04.885 ( 0.433s) [RANK: 0 ] utils.cpp:612 INFO| Compute partition of cells across ranks +2023-05-16 15:54:04.886 ( 0.433s) [RANK: 0 ] graphbuild.cpp:533 INFO| Building mesh dual graph +2023-05-16 15:54:04.886 ( 0.433s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph +2023-05-16 15:54:05.046 ( 0.593s) [RANK: 0 ] graphbuild.cpp:89 INFO| Build nonlocal part of mesh dual graph +2023-05-16 15:54:05.060 ( 0.607s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:05.060 ( 0.607s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:05.060 ( 0.607s) [RANK: 0 ] graphbuild.cpp:203 INFO| Number of destination and source ranks in non-local dual graph construction, and ratio to total number of ranks: 2, 2, 0.666667, 0.666667 +2023-05-16 15:54:05.097 ( 0.644s) [RANK: 0 ] graphbuild.cpp:545 INFO| Graph edges (local: 66332, non-local: 962) +2023-05-16 15:54:05.097 ( 0.644s) [RANK: 0 ] partitioners.cpp:316 INFO| Compute graph partition using PT-SCOTCH +2023-05-16 15:54:18.587 ( 14.134s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 +2023-05-16 15:54:18.608 ( 14.155s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 +2023-05-16 15:54:18.874 ( 14.421s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph +2023-05-16 15:54:19.026 ( 14.573s) [RANK: 0 ] ordering.cpp:202 INFO| GPS pseudo-diameter:(119) 17038-1320 + +2023-05-16 15:54:19.040 ( 14.587s) [RANK: 0 ] Topology.cpp:923 INFO| Create topology +2023-05-16 15:54:19.060 ( 14.607s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 +2023-05-16 15:54:19.084 ( 14.631s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 +2023-05-16 15:54:19.283 ( 14.830s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:19.304 ( 14.851s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:19.340 ( 14.887s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:19.364 ( 14.911s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:19.404 ( 14.951s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:19.436 ( 14.983s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:19.480 ( 15.027s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:54:19.504 ( 15.051s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:54:19.597 ( 15.144s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:19.628 ( 15.175s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:19.705 ( 15.252s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:54:19.716 ( 15.263s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:54:19.717 ( 15.264s) [RANK: 0 ] MPI.h:368 INFO| Number of neighbourhood source ranks in distribute_to_postoffice: 0 +2023-05-16 15:54:19.753 ( 15.300s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:19.776 ( 15.323s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:19.777 ( 15.324s) [RANK: 0 ] MPI.h:500 INFO| Neighbourhood destination ranks from post office in distribute_data (rank, num dests, num dests/mpi_size): 0, 2, 0.666667 UnitCube (24x19x19) to be refined 0 times -2023-05-15 13:41:10.760 ( 10.762s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 2 -2023-05-15 13:41:10.778 ( 10.779s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.779 ( 10.780s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.857 ( 10.858s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.857 ( 10.859s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.859 ( 10.861s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:41:10.859 ( 10.861s) [RANK: 0 ]topologycomputation.cpp:650 INFO| Computing mesh connectivity 2 - 3 from transpose. -2023-05-15 13:41:10.862 ( 10.864s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 0 -2023-05-15 13:41:10.866 ( 10.868s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.866 ( 10.868s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.867 ( 10.869s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.867 ( 10.869s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.868 ( 10.869s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:10.868 ( 10.869s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:10.868 ( 10.870s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:10.868 ( 10.870s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:10.870 ( 10.871s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 -2023-05-15 13:41:10.870 ( 10.872s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 -2023-05-15 13:41:10.870 ( 10.872s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 0 -2023-05-15 13:41:10.871 ( 10.873s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:41:10.917 ( 10.919s) [RANK: 0 ] SparsityPattern.cpp:389 INFO| Column ghost size increased from 221 to 540 +2023-05-16 15:54:19.953 ( 15.500s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 2 +2023-05-16 15:54:20.014 ( 15.561s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:20.028 ( 15.575s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:20.361 ( 15.908s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:20.388 ( 15.935s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:20.430 ( 15.977s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:54:20.430 ( 15.977s) [RANK: 0 ]topologycomputation.cpp:650 INFO| Computing mesh connectivity 2 - 3 from transpose. +2023-05-16 15:54:20.437 ( 15.984s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 0 +2023-05-16 15:54:20.445 ( 15.992s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:20.460 ( 16.007s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:20.537 ( 16.084s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:20.548 ( 16.095s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:20.613 ( 16.160s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:54:20.624 ( 16.171s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:54:20.753 ( 16.300s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:20.768 ( 16.315s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:20.921 ( 16.468s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 +2023-05-16 15:54:20.921 ( 16.468s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 +2023-05-16 15:54:20.921 ( 16.468s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 0 +2023-05-16 15:54:20.922 ( 16.469s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:54:21.295 ( 16.842s) [RANK: 0 ] SparsityPattern.cpp:389 INFO| Column ghost size increased from 215 to 557 ---------------------------------------------------------------- Test problem summary @@ -1919,7 +1962,7 @@ Total degrees of freedom: 30000 (30 thousand) Average degrees of freedom per process: 10000 ---------------------------------------------------------------- -2023-05-15 13:41:11.264 ( 11.266s) [RANK: 0 ] petsc.cpp:677 INFO| PETSc Krylov solver starting to solve system. +2023-05-16 15:54:23.745 ( 19.292s) [RANK: 0 ] petsc.cpp:677 INFO| PETSc Krylov solver starting to solve system. KSP Object: 3 MPI processes type: cg maximum iterations=10000, initial guess is zero @@ -1937,7 +1980,7 @@ AGG specific options Number of levels to square graph 1 Number smoothing steps 1 - Complexity: grid = 1.0636 operator = 1.25273 + Complexity: grid = 1.0674 operator = 1.27215 Coarse grid solver -- level 0 ------------------------------- KSP Object: (mg_coarse_) 3 MPI processes type: preonly @@ -1962,33 +2005,33 @@ tolerance for zero pivot 2.22045e-14 using diagonal shift on blocks to prevent zero pivot [INBLOCKS] matrix ordering: nd - factor fill ratio given 5., needed 1.02381 + factor fill ratio given 5., needed 1.03308 Factored matrix follows: Mat Object: (mg_coarse_sub_) 1 MPI process type: seqaij - rows=204, cols=204, bs=6 + rows=228, cols=228, bs=6 package used to perform factorization: petsc - total: nonzeros=40248, allocated nonzeros=40248 - using I-node routines: found 48 nodes, limit used is 5 + total: nonzeros=49464, allocated nonzeros=49464 + using I-node routines: found 57 nodes, limit used is 5 linear system matrix = precond matrix: Mat Object: (mg_coarse_sub_) 1 MPI process type: seqaij - rows=204, cols=204, bs=6 - total: nonzeros=39312, allocated nonzeros=39312 + rows=228, cols=228, bs=6 + total: nonzeros=47880, allocated nonzeros=47880 total number of mallocs used during MatSetValues calls=0 - using I-node routines: found 57 nodes, limit used is 5 + using I-node routines: found 61 nodes, limit used is 5 linear system matrix = precond matrix: Mat Object: 3 MPI processes type: mpiaij - rows=204, cols=204, bs=6 - total: nonzeros=39312, allocated nonzeros=39312 + rows=228, cols=228, bs=6 + total: nonzeros=47880, allocated nonzeros=47880 total number of mallocs used during MatSetValues calls=0 - using I-node (on process 0) routines: found 57 nodes, limit used is 5 + using I-node (on process 0) routines: found 61 nodes, limit used is 5 Down solver (pre-smoother) on level 1 ------------------------------- KSP Object: (mg_levels_1_) 3 MPI processes type: chebyshev - eigenvalue targets used: min 0.207028, max 2.27731 - eigenvalues provided (min 1.03041e-06, max 2.07028) with transform: [0. 0.1; 0. 1.1] + eigenvalue targets used: min 0.227046, max 2.4975 + eigenvalues provided (min 8.00233e-07, max 2.27046) with transform: [0. 0.1; 0. 1.1] maximum iterations=2, nonzero initial guess tolerances: relative=1e-05, absolute=1e-50, divergence=10000. left preconditioning @@ -1999,17 +2042,17 @@ linear system matrix = precond matrix: Mat Object: 3 MPI processes type: mpiaij - rows=1704, cols=1704, bs=6 - total: nonzeros=276984, allocated nonzeros=276984 + rows=1794, cols=1794, bs=6 + total: nonzeros=292716, allocated nonzeros=292716 total number of mallocs used during MatSetValues calls=0 using scalable MatPtAP() implementation - using I-node (on process 0) routines: found 172 nodes, limit used is 5 + using I-node (on process 0) routines: found 185 nodes, limit used is 5 Up solver (post-smoother) same as down solver (pre-smoother) Down solver (pre-smoother) on level 2 ------------------------------- KSP Object: (mg_levels_2_) 3 MPI processes type: chebyshev - eigenvalue targets used: min 0.258798, max 2.84678 - eigenvalues provided (min 0.0683816, max 2.58798) with transform: [0. 0.1; 0. 1.1] + eigenvalue targets used: min 0.25857, max 2.84427 + eigenvalues provided (min 0.0756389, max 2.5857) with transform: [0. 0.1; 0. 1.1] maximum iterations=2, nonzero initial guess tolerances: relative=1e-05, absolute=1e-50, divergence=10000. left preconditioning @@ -2024,7 +2067,7 @@ total: nonzeros=1251522, allocated nonzeros=1251522 total number of mallocs used during MatSetValues calls=0 has attached near null space - using I-node (on process 0) routines: found 3414 nodes, limit used is 5 + using I-node (on process 0) routines: found 3448 nodes, limit used is 5 Up solver (post-smoother) same as down solver (pre-smoother) linear system matrix = precond matrix: Mat Object: 3 MPI processes @@ -2033,49 +2076,49 @@ total: nonzeros=1251522, allocated nonzeros=1251522 total number of mallocs used during MatSetValues calls=0 has attached near null space - using I-node (on process 0) routines: found 3414 nodes, limit used is 5 + using I-node (on process 0) routines: found 3448 nodes, limit used is 5 [MPI_MAX] Summary of timings | reps wall avg wall tot --------------------------------------------------------------------------------------------------------- -Build BoxMesh | 1 10.581018 10.581018 -Build dofmap data | 2 0.006416 0.012832 -Build sparsity | 1 0.011399 0.011399 -Compute connectivity 2-3 | 1 0.001426 0.001426 -Compute dof reordering map | 2 0.000356 0.000712 -Compute entities of dim = 2 | 1 0.099688 0.099688 -Compute graph partition (SCOTCH) | 1 10.375435 10.375435 -Compute local part of mesh dual graph | 2 0.069003 0.138007 -Compute local-to-local map | 1 0.000565 0.000565 -Compute non-local part of mesh dual graph | 1 0.054754 0.054754 -Compute-local-to-global links for global/local adjacency list | 1 0.001036 0.001036 -Distribute AdjacencyList nodes to destination ranks | 1 0.006939 0.006939 -Distribute row-wise data (scalable) | 1 0.002330 0.002330 -Extract partition boundaries from SCOTCH graph | 1 0.001075 0.001075 -GPS: create_level_structure | 5 0.000752 0.004513 -Get SCOTCH graph data | 1 0.000015 0.000015 -Gibbs-Poole-Stockmeyer ordering | 1 0.009555 0.009555 -Init MPI | 1 0.174836 0.174836 -Init PETSc | 1 0.004347 0.004347 -Init dofmap from element dofmap | 2 0.003456 0.006911 -Init logging | 1 0.000071 0.000071 -PETSc Krylov solver | 1 1.305917 1.305917 -SCOTCH: call SCOTCH_dgraphBuild | 1 0.000303 0.000303 -SCOTCH: call SCOTCH_dgraphHalo | 1 0.036442 0.036442 -SCOTCH: call SCOTCH_dgraphPart | 1 10.370280 10.370280 -SparsityPattern::assemble | 1 0.015109 0.015109 -Topology: create | 1 0.024283 0.024283 -Topology: determine shared index ownership | 1 0.001762 0.001762 -Topology: determine vertex ownership groups (owned, undetermined, unowned) | 1 0.004275 0.004275 -ZZZ Assemble matrix | 1 0.302216 0.302216 -ZZZ Assemble vector | 1 0.015798 0.015798 -ZZZ Create Mesh | 1 10.581974 10.581974 -ZZZ Create RHS function | 1 0.024522 0.024522 -ZZZ Create boundary conditions | 1 0.002858 0.002858 -ZZZ Create facets and facet->cell connectivity | 1 0.101084 0.101084 -ZZZ Create forms | 1 0.000108 0.000108 -ZZZ Create near-nullspace | 1 0.014960 0.014960 -ZZZ FunctionSpace | 1 0.008922 0.008922 -ZZZ Solve | 1 1.316348 1.316348 +Build BoxMesh | 1 15.089877 15.089877 +Build dofmap data | 2 0.326229 0.652459 +Build sparsity | 1 0.058172 0.058172 +Compute connectivity 2-3 | 1 0.001090 0.001090 +Compute dof reordering map | 2 0.004372 0.008745 +Compute entities of dim = 2 | 1 0.478302 0.478302 +Compute graph partition (SCOTCH) | 1 13.478990 13.478990 +Compute local part of mesh dual graph | 2 0.154720 0.309440 +Compute local-to-local map | 1 0.000597 0.000597 +Compute non-local part of mesh dual graph | 1 0.115469 0.115469 +Compute-local-to-global links for global/local adjacency list | 1 0.000973 0.000973 +Distribute AdjacencyList nodes to destination ranks | 1 0.310685 0.310685 +Distribute row-wise data (scalable) | 1 0.212331 0.212331 +Extract partition boundaries from SCOTCH graph | 1 0.001238 0.001238 +GPS: create_level_structure | 4 0.004851 0.010855 +Get SCOTCH graph data | 1 0.000016 0.000016 +Gibbs-Poole-Stockmeyer ordering | 1 0.024069 0.024069 +Init MPI | 1 0.371885 0.371885 +Init PETSc | 1 0.058751 0.058751 +Init dofmap from element dofmap | 2 0.002709 0.005417 +Init logging | 1 0.000070 0.000070 +PETSc Krylov solver | 1 10.399788 10.399788 +SCOTCH: call SCOTCH_dgraphBuild | 1 0.015521 0.015521 +SCOTCH: call SCOTCH_dgraphHalo | 1 0.095924 0.095924 +SCOTCH: call SCOTCH_dgraphPart | 1 13.430764 13.430764 +SparsityPattern::assemble | 1 0.123636 0.123636 +Topology: create | 1 0.453010 0.453010 +Topology: determine shared index ownership | 1 0.229477 0.229477 +Topology: determine vertex ownership groups (owned, undetermined, unowned) | 1 0.011552 0.011552 +ZZZ Assemble matrix | 1 1.088322 1.088322 +ZZZ Assemble vector | 1 0.067986 0.067986 +ZZZ Create Mesh | 1 15.090140 15.090140 +ZZZ Create RHS function | 1 0.159212 0.159212 +ZZZ Create boundary conditions | 1 0.155532 0.155532 +ZZZ Create facets and facet->cell connectivity | 1 0.479468 0.479468 +ZZZ Create forms | 1 0.000110 0.000110 +ZZZ Create near-nullspace | 1 0.873164 0.873164 +ZZZ FunctionSpace | 1 0.389632 0.389632 +ZZZ Solve | 1 10.659988 10.659988 *** Number of Krylov iterations: 21 *** Solution norm: 3.6795e-05 **************************************************************************************************************************************************************** @@ -2084,17 +2127,17 @@ ------------------------------------------------------------------ PETSc Performance Summary: ------------------------------------------------------------------ -/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/dolfinx-scaling-test on a named virt64c with 3 processors, by pbuilder1 Mon May 15 13:41:12 2023 +/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/dolfinx-scaling-test on a named i-capture-the-hostname with 3 processors, by pbuilder2 Tue May 16 15:54:34 2023 Using Petsc Release Version 3.18.5, Feb 27, 2023 Max Max/Min Avg Total -Time (sec): 1.240e+01 1.000 1.240e+01 +Time (sec): 2.935e+01 1.000 2.935e+01 Objects: 4.630e+02 1.004 4.617e+02 -Flops: 2.153e+08 1.080 2.071e+08 6.214e+08 -Flops/sec: 1.736e+07 1.080 1.671e+07 5.012e+07 -MPI Msg Count: 8.170e+02 1.044 7.947e+02 2.384e+03 -MPI Msg Len (bytes): 6.444e+06 1.406 6.964e+03 1.660e+07 -MPI Reductions: 6.360e+02 1.000 +Flops: 2.168e+08 1.048 2.126e+08 6.377e+08 +Flops/sec: 7.387e+06 1.048 7.242e+06 2.173e+07 +MPI Msg Count: 8.210e+02 1.041 7.993e+02 2.398e+03 +MPI Msg Len (bytes): 6.991e+06 1.476 7.130e+03 1.710e+07 +MPI Reductions: 6.370e+02 1.000 Flop counting convention: 1 flop = 1 real number operation of type (multiply/divide/add/subtract) e.g., VecAXPY() for real vectors of length N --> 2N flops @@ -2102,7 +2145,7 @@ Summary of Stages: ----- Time ------ ----- Flop ------ --- Messages --- -- Message Lengths -- -- Reductions -- Avg %Total Avg %Total Count %Total Avg %Total Count %Total - 0: Main Stage: 1.2399e+01 100.0% 6.2145e+08 100.0% 2.384e+03 100.0% 6.964e+03 100.0% 6.180e+02 97.2% + 0: Main Stage: 2.9349e+01 100.0% 6.3768e+08 100.0% 2.398e+03 100.0% 7.130e+03 100.0% 6.190e+02 97.2% ------------------------------------------------------------------------------------------------------------------------ See the 'Profiling' chapter of the users' manual for details on interpreting output. @@ -2126,79 +2169,79 @@ --- Event Stage 0: Main Stage -BuildTwoSided 103 1.0 9.3472e-02 10.7 0.00e+00 0.0 1.4e+02 4.0e+00 1.0e+02 0 0 6 0 16 0 0 6 0 17 0 -BuildTwoSidedF 86 1.0 9.2749e-02 12.3 0.00e+00 0.0 1.1e+02 3.8e+04 8.6e+01 0 0 5 25 14 0 0 5 25 14 0 -MatMult 217 1.0 3.0018e-01 1.0 1.22e+08 1.1 1.3e+03 5.3e+03 2.0e+00 2 56 56 42 0 2 56 56 42 0 1161 -MatMultAdd 44 1.0 7.3101e-02 1.2 1.00e+07 1.1 1.8e+02 1.3e+03 0.0e+00 1 5 7 1 0 1 5 7 1 0 399 -MatMultTranspose 44 1.0 3.8032e-02 1.1 1.00e+07 1.1 1.9e+02 1.3e+03 2.0e+00 0 5 8 1 0 0 5 8 1 0 767 -MatSolve 22 0.0 2.4946e-03 0.0 1.77e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 708 -MatLUFactorSym 1 1.0 2.5631e-03 65.7 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatLUFactorNum 1 1.0 9.3624e-03 2147.3 5.11e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 545 -MatConvert 1 1.0 9.8171e-04 1.4 0.00e+00 0.0 1.2e+01 6.8e+02 1.0e+00 0 0 1 0 0 0 0 1 0 0 0 -MatScale 4 1.0 1.5973e-03 1.2 4.54e+05 1.1 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 829 -MatResidual 44 1.0 5.6744e-02 1.0 2.37e+07 1.1 2.6e+02 5.1e+03 0.0e+00 0 11 11 8 0 0 11 11 8 0 1185 -MatAssemblyBegin 59 1.0 1.1653e-01 3.6 0.00e+00 0.0 1.1e+02 3.8e+04 3.0e+01 1 0 5 25 5 1 0 5 25 5 0 -MatAssemblyEnd 59 1.0 9.2227e-02 1.0 9.09e+04 2.2 0.0e+00 0.0e+00 9.6e+01 1 0 0 0 15 1 0 0 0 16 2 -MatGetRowIJ 1 0.0 1.0595e-04 0.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatCreateSubMat 2 1.0 1.6014e-02 1.0 0.00e+00 0.0 1.0e+01 3.5e+04 2.8e+01 0 0 0 2 4 0 0 0 2 5 0 -MatGetOrdering 1 0.0 2.6110e-04 0.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatCoarsen 2 1.0 2.6138e-02 1.0 1.40e+05 1.1 2.3e+02 7.3e+02 9.6e+01 0 0 10 1 15 0 0 10 1 16 16 -MatZeroEntries 3 1.0 2.1208e-04 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatView 6 1.5 9.9578e-03 1.5 0.00e+00 0.0 0.0e+00 0.0e+00 4.0e+00 0 0 0 0 1 0 0 0 0 1 0 -MatAXPY 4 1.0 2.7020e-02 1.0 1.15e+05 1.1 0.0e+00 0.0e+00 1.2e+01 0 0 0 0 2 0 0 0 0 2 12 -MatTranspose 10 1.0 1.5749e-02 1.1 0.00e+00 0.0 9.0e+01 2.1e+03 3.2e+01 0 0 4 1 5 0 0 4 1 5 0 -MatMatMultSym 9 1.0 9.4770e-02 1.1 0.00e+00 0.0 5.1e+01 1.1e+04 2.8e+01 1 0 2 4 4 1 0 2 4 5 0 -MatMatMultNum 3 1.0 3.0998e-02 1.0 6.46e+06 1.1 1.5e+01 2.4e+04 3.0e+00 0 3 1 2 0 0 3 1 2 0 592 -MatPtAPSymbolic 3 1.0 2.3874e-01 1.0 0.00e+00 0.0 9.9e+01 3.4e+04 2.1e+01 2 0 4 20 3 2 0 4 20 3 0 -MatPtAPNumeric 3 1.0 3.8238e-01 1.0 5.33e+07 1.1 3.0e+01 8.9e+04 1.5e+01 3 24 1 16 2 3 24 1 16 2 392 -MatGetLocalMat 9 1.0 7.5062e-03 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatGetBrAoCol 9 1.0 1.0145e-02 1.0 0.00e+00 0.0 1.2e+02 3.0e+04 1.0e+00 0 0 5 22 0 0 0 5 22 0 0 -VecMDot 20 1.0 4.1666e-03 1.3 1.19e+06 1.1 0.0e+00 0.0e+00 2.0e+01 0 1 0 0 3 0 1 0 0 3 837 -VecTDot 42 1.0 4.1341e-03 1.8 8.60e+05 1.1 0.0e+00 0.0e+00 4.2e+01 0 0 0 0 7 0 0 0 0 7 610 -VecNorm 44 1.0 3.9654e-03 1.6 6.87e+05 1.1 0.0e+00 0.0e+00 4.4e+01 0 0 0 0 7 0 0 0 0 7 509 -VecScale 22 1.0 1.6296e-04 1.0 1.19e+05 1.1 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 2140 -VecCopy 136 1.0 1.1067e-03 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecSet 203 1.0 7.8643e-04 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecAXPY 44 1.0 1.6215e-03 1.2 8.82e+05 1.1 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 1593 -VecAYPX 284 1.0 7.1533e-03 1.2 2.32e+06 1.1 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 948 -VecAXPBYCZ 88 1.0 5.0457e-03 1.6 2.39e+06 1.1 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 1382 -VecMAXPY 22 1.0 1.9025e-03 1.1 1.41e+06 1.1 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 2166 -VecAssemblyBegin 57 1.0 2.0307e-03 1.4 0.00e+00 0.0 0.0e+00 0.0e+00 5.6e+01 0 0 0 0 9 0 0 0 0 9 0 -VecAssemblyEnd 57 1.0 1.7503e-04 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecPointwiseMult 198 1.0 4.8936e-03 1.0 1.07e+06 1.1 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 641 -VecScatterBegin 363 1.0 9.5596e-03 1.1 0.00e+00 0.0 1.9e+03 4.0e+03 8.0e+00 0 0 80 46 1 0 0 80 46 1 0 -VecScatterEnd 363 1.0 6.9398e-02 2.4 1.23e+04 1.7 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecNormalize 22 1.0 1.4627e-03 1.7 3.58e+05 1.1 0.0e+00 0.0e+00 2.2e+01 0 0 0 0 3 0 0 0 0 4 715 -SFSetGraph 35 1.0 3.5542e-04 1.3 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFSetUp 17 1.0 2.9767e-03 1.3 0.00e+00 0.0 1.6e+02 4.8e+02 1.7e+01 0 0 7 0 3 0 0 7 0 3 0 -SFBcastBegin 14 1.0 1.9956e-04 1.1 0.00e+00 0.0 8.4e+01 6.4e+02 0.0e+00 0 0 4 0 0 0 0 4 0 0 0 -SFBcastEnd 14 1.0 1.8566e-04 1.8 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFReduceBegin 4 1.0 1.1933e-04 1.1 0.00e+00 0.0 1.8e+01 5.3e+02 0.0e+00 0 0 1 0 0 0 0 1 0 0 0 -SFReduceEnd 4 1.0 5.4756e-05 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFPack 381 1.0 2.7815e-03 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFUnpack 381 1.0 6.2282e-04 1.0 1.23e+04 1.7 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 47 -KSPSetUp 7 1.0 6.7648e-04 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 4.0e+00 0 0 0 0 1 0 0 0 0 1 0 -KSPSolve 1 1.0 4.1196e-01 1.0 1.39e+08 1.1 1.6e+03 4.4e+03 7.0e+01 3 65 65 41 11 3 65 65 41 11 986 -KSPGMRESOrthog 20 1.0 5.9110e-03 1.2 2.39e+06 1.1 0.0e+00 0.0e+00 2.0e+01 0 1 0 0 3 0 1 0 0 3 1180 -PCSetUp_GAMG+ 1 1.0 8.7483e-01 1.0 7.41e+07 1.1 8.0e+02 1.1e+04 5.0e+02 7 34 33 52 79 7 34 33 52 81 239 - PCGAMGCreateG 2 1.0 5.1081e-02 1.0 5.03e+04 1.1 6.0e+01 2.9e+03 4.4e+01 0 0 3 1 7 0 0 3 1 7 3 - GAMG Coarsen 2 1.0 2.8146e-02 1.0 1.40e+05 1.1 2.3e+02 7.3e+02 9.6e+01 0 0 10 1 15 0 0 10 1 16 15 - GAMG MIS/Agg 2 1.0 2.6190e-02 1.0 1.40e+05 1.1 2.3e+02 7.3e+02 9.6e+01 0 0 10 1 15 0 0 10 1 16 16 - PCGAMGProl 2 1.0 3.3644e-02 1.0 0.00e+00 0.0 1.9e+02 1.9e+03 1.9e+02 0 0 8 2 30 0 0 8 2 30 0 - GAMG Prol-col 2 1.0 1.4342e-02 1.0 0.00e+00 0.0 1.8e+02 7.0e+02 1.7e+02 0 0 8 1 27 0 0 8 1 28 0 - GAMG Prol-lift 2 1.0 1.8614e-02 1.0 0.00e+00 0.0 1.2e+01 1.9e+04 1.0e+01 0 0 1 1 2 0 0 1 1 2 0 - PCGAMGOptProl 2 1.0 1.3286e-01 1.0 2.07e+07 1.1 1.9e+02 8.3e+03 8.2e+01 1 10 8 10 13 1 10 8 10 13 445 - GAMG smooth 2 1.0 9.1543e-02 1.0 6.97e+06 1.1 4.8e+01 2.0e+04 2.6e+01 1 3 2 6 4 1 3 2 6 4 217 - PCGAMGCreateL 2 1.0 6.2683e-01 1.0 5.32e+07 1.1 1.2e+02 5.2e+04 7.7e+01 5 24 5 38 12 5 24 5 38 12 238 - GAMG PtAP 2 1.0 6.0919e-01 1.0 5.32e+07 1.1 9.6e+01 6.2e+04 2.4e+01 5 24 4 36 4 5 24 4 36 4 245 - GAMG Reduce 1 1.0 1.8754e-02 1.1 0.00e+00 0.0 2.5e+01 1.5e+04 5.3e+01 0 0 1 2 8 0 0 1 2 9 0 -PCGAMG Gal l00 1 1.0 4.3578e-01 1.0 3.42e+07 1.0 4.8e+01 8.2e+04 1.2e+01 4 16 2 24 2 4 16 2 24 2 234 -PCGAMG Opt l00 1 1.0 6.0861e-02 1.0 5.10e+06 1.1 2.4e+01 3.2e+04 1.0e+01 0 2 1 5 2 0 2 1 5 2 247 -PCGAMG Gal l01 1 1.0 1.7340e-01 1.0 1.91e+07 1.6 4.8e+01 4.1e+04 1.2e+01 1 8 2 12 2 1 8 2 12 2 273 -PCGAMG Opt l01 1 1.0 1.3331e-02 1.0 1.36e+06 1.5 2.4e+01 7.7e+03 1.0e+01 0 1 1 1 2 0 1 1 1 2 249 -PCSetUp 2 1.0 8.8727e-01 1.0 7.41e+07 1.1 8.0e+02 1.1e+04 5.0e+02 7 34 33 52 79 7 34 33 52 81 242 -PCSetUpOnBlocks 22 1.0 1.2498e-02 34.8 5.11e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 409 -PCApply 22 1.0 3.5936e-01 1.0 1.19e+08 1.1 1.4e+03 4.1e+03 6.0e+00 3 56 60 35 1 3 56 60 35 1 965 +BuildTwoSided 103 1.0 8.9463e-01 1.3 0.00e+00 0.0 1.4e+02 4.0e+00 1.0e+02 3 0 6 0 16 3 0 6 0 17 0 +BuildTwoSidedF 86 1.0 6.7899e-01 1.4 0.00e+00 0.0 1.2e+02 3.6e+04 8.6e+01 2 0 5 25 14 2 0 5 25 14 0 +MatMult 217 1.0 3.0318e+00 1.0 1.21e+08 1.1 1.3e+03 5.5e+03 2.0e+00 10 55 55 42 0 10 55 55 42 0 116 +MatMultAdd 44 1.0 4.0175e-01 1.2 1.02e+07 1.0 1.8e+02 1.3e+03 0.0e+00 1 5 7 1 0 1 5 7 1 0 74 +MatMultTranspose 44 1.0 3.8570e-01 1.3 1.02e+07 1.0 1.9e+02 1.2e+03 2.0e+00 1 5 8 1 0 1 5 8 1 0 77 +MatSolve 22 0.0 2.7221e-03 0.0 2.17e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 798 +MatLUFactorSym 1 1.0 2.9823e-03 71.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatLUFactorNum 1 1.0 3.5502e-02 8256.2 6.90e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 194 +MatConvert 1 1.0 3.4617e-02 1.1 0.00e+00 0.0 1.2e+01 7.1e+02 1.0e+00 0 0 1 0 0 0 0 1 0 0 0 +MatScale 4 1.0 1.1642e-03 1.0 4.62e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 1165 +MatResidual 44 1.0 6.2004e-01 1.1 2.34e+07 1.1 2.6e+02 5.2e+03 0.0e+00 2 11 11 8 0 2 11 11 8 0 110 +MatAssemblyBegin 59 1.0 5.2836e-01 1.5 0.00e+00 0.0 1.2e+02 3.6e+04 3.0e+01 2 0 5 25 5 2 0 5 25 5 0 +MatAssemblyEnd 59 1.0 1.3200e+00 1.0 8.67e+04 2.0 0.0e+00 0.0e+00 9.6e+01 4 0 0 0 15 4 0 0 0 16 0 +MatGetRowIJ 1 0.0 1.1165e-04 0.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatCreateSubMat 2 1.0 9.5750e-02 1.0 0.00e+00 0.0 1.0e+01 4.4e+04 2.8e+01 0 0 0 3 4 0 0 0 3 5 0 +MatGetOrdering 1 0.0 3.0735e-04 0.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatCoarsen 2 1.0 1.2596e+00 1.0 1.39e+05 1.0 2.4e+02 7.5e+02 9.7e+01 4 0 10 1 15 4 0 10 1 16 0 +MatZeroEntries 3 1.0 6.1706e-04 3.6 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatView 6 1.5 9.9470e-02 1.5 0.00e+00 0.0 0.0e+00 0.0e+00 4.0e+00 0 0 0 0 1 0 0 0 0 1 0 +MatAXPY 4 1.0 1.8623e-01 1.1 1.15e+05 1.1 0.0e+00 0.0e+00 1.2e+01 1 0 0 0 2 1 0 0 0 2 2 +MatTranspose 10 1.0 3.9359e-01 1.0 0.00e+00 0.0 9.0e+01 2.1e+03 3.2e+01 1 0 4 1 5 1 0 4 1 5 0 +MatMatMultSym 9 1.0 4.5617e-01 1.0 0.00e+00 0.0 5.1e+01 1.2e+04 2.8e+01 2 0 2 4 4 2 0 2 4 5 0 +MatMatMultNum 3 1.0 1.2945e-01 1.1 6.40e+06 1.1 1.5e+01 2.5e+04 3.0e+00 0 3 1 2 0 0 3 1 2 0 143 +MatPtAPSymbolic 3 1.0 1.0116e+00 1.0 0.00e+00 0.0 9.9e+01 3.4e+04 2.1e+01 3 0 4 20 3 3 0 4 20 3 0 +MatPtAPNumeric 3 1.0 1.3500e+00 1.0 5.61e+07 1.1 3.0e+01 8.8e+04 1.5e+01 5 25 1 15 2 5 25 1 15 2 118 +MatGetLocalMat 9 1.0 1.5575e-02 1.5 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatGetBrAoCol 9 1.0 4.4929e-01 1.5 0.00e+00 0.0 1.2e+02 3.1e+04 1.0e+00 1 0 5 22 0 1 0 5 22 0 0 +VecMDot 20 1.0 1.7294e-01 2.1 1.20e+06 1.1 0.0e+00 0.0e+00 2.0e+01 0 1 0 0 3 0 1 0 0 3 20 +VecTDot 42 1.0 2.6172e-01 1.1 8.69e+05 1.1 0.0e+00 0.0e+00 4.2e+01 1 0 0 0 7 1 0 0 0 7 10 +VecNorm 44 1.0 2.8999e-01 1.5 6.95e+05 1.1 0.0e+00 0.0e+00 4.4e+01 1 0 0 0 7 1 0 0 0 7 7 +VecScale 22 1.0 2.5038e-04 1.2 1.20e+05 1.1 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 1397 +VecCopy 136 1.0 1.0738e-03 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecSet 203 1.0 8.1563e-04 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecAXPY 44 1.0 2.0692e-03 1.6 8.91e+05 1.1 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 1249 +VecAYPX 284 1.0 1.4715e-02 2.4 2.33e+06 1.1 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 462 +VecAXPBYCZ 88 1.0 3.2111e-03 1.1 2.40e+06 1.1 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 2178 +VecMAXPY 22 1.0 2.5597e-03 1.2 1.42e+06 1.1 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 1615 +VecAssemblyBegin 57 1.0 2.7316e-01 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 5.6e+01 1 0 0 0 9 1 0 0 0 9 0 +VecAssemblyEnd 57 1.0 2.9146e-04 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecPointwiseMult 198 1.0 4.7277e-03 1.1 1.08e+06 1.1 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 666 +VecScatterBegin 363 1.0 1.8983e-01 1.2 0.00e+00 0.0 1.9e+03 4.2e+03 8.0e+00 1 0 79 46 1 1 0 79 46 1 0 +VecScatterEnd 363 1.0 3.3018e+00 1.0 1.29e+04 1.8 0.0e+00 0.0e+00 0.0e+00 11 0 0 0 0 11 0 0 0 0 0 +VecNormalize 22 1.0 1.3706e-01 1.6 3.60e+05 1.1 0.0e+00 0.0e+00 2.2e+01 0 0 0 0 3 0 0 0 0 4 8 +SFSetGraph 35 1.0 4.0226e-04 1.3 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFSetUp 17 1.0 3.6709e-01 1.2 0.00e+00 0.0 1.6e+02 5.0e+02 1.7e+01 1 0 7 0 3 1 0 7 0 3 0 +SFBcastBegin 15 1.0 4.6338e-04 1.1 0.00e+00 0.0 9.0e+01 6.4e+02 0.0e+00 0 0 4 0 0 0 0 4 0 0 0 +SFBcastEnd 15 1.0 2.4212e-01 1.4 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 1 0 0 0 0 1 0 0 0 0 0 +SFReduceBegin 4 1.0 1.5765e-04 1.2 0.00e+00 0.0 1.8e+01 5.5e+02 0.0e+00 0 0 1 0 0 0 0 1 0 0 0 +SFReduceEnd 4 1.0 4.1759e-02 1.7 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFPack 382 1.0 3.1243e-03 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFUnpack 382 1.0 2.7965e-03 2.2 1.29e+04 1.8 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 10 +KSPSetUp 7 1.0 6.5718e-04 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 4.0e+00 0 0 0 0 1 0 0 0 0 1 0 +KSPSolve 1 1.0 3.8514e+00 1.0 1.43e+08 1.1 1.6e+03 4.6e+03 7.0e+01 13 65 65 41 11 13 65 65 41 11 107 +KSPGMRESOrthog 20 1.0 1.7544e-01 2.0 2.40e+06 1.1 0.0e+00 0.0e+00 2.0e+01 0 1 0 0 3 0 1 0 0 3 40 +PCSetUp_GAMG+ 1 1.0 6.3561e+00 1.0 7.67e+07 1.1 8.0e+02 1.1e+04 5.0e+02 22 34 33 52 79 22 34 33 52 81 34 + PCGAMGCreateG 2 1.0 6.7722e-01 1.0 4.97e+04 1.0 6.0e+01 2.9e+03 4.4e+01 2 0 3 1 7 2 0 3 1 7 0 + GAMG Coarsen 2 1.0 1.2689e+00 1.0 1.39e+05 1.0 2.4e+02 7.5e+02 9.7e+01 4 0 10 1 15 4 0 10 1 16 0 + GAMG MIS/Agg 2 1.0 1.2596e+00 1.0 1.39e+05 1.0 2.4e+02 7.5e+02 9.7e+01 4 0 10 1 15 4 0 10 1 16 0 + PCGAMGProl 2 1.0 1.0609e+00 1.0 0.00e+00 0.0 1.9e+02 2.2e+03 1.9e+02 4 0 8 3 30 4 0 8 3 30 0 + GAMG Prol-col 2 1.0 9.3028e-01 1.0 0.00e+00 0.0 1.8e+02 8.3e+02 1.7e+02 3 0 8 1 27 3 0 8 1 27 0 + GAMG Prol-lift 2 1.0 1.0003e-01 1.1 0.00e+00 0.0 1.2e+01 2.3e+04 1.0e+01 0 0 1 2 2 0 0 1 2 2 0 + PCGAMGOptProl 2 1.0 1.0578e+00 1.0 2.05e+07 1.1 1.9e+02 8.5e+03 8.2e+01 4 9 8 10 13 4 9 8 10 13 56 + GAMG smooth 2 1.0 4.6057e-01 1.0 6.92e+06 1.1 4.8e+01 2.0e+04 2.6e+01 2 3 2 6 4 2 3 2 6 4 44 + PCGAMGCreateL 2 1.0 2.2261e+00 1.0 5.60e+07 1.1 1.2e+02 5.3e+04 7.7e+01 8 25 5 38 12 8 25 5 38 12 71 + GAMG PtAP 2 1.0 2.0898e+00 1.0 5.60e+07 1.1 9.6e+01 6.2e+04 2.4e+01 7 25 4 35 4 7 25 4 35 4 76 + GAMG Reduce 1 1.0 1.4452e-01 1.1 0.00e+00 0.0 2.5e+01 1.8e+04 5.3e+01 0 0 1 3 8 0 0 1 3 9 0 +PCGAMG Gal l00 1 1.0 1.5322e+00 1.0 3.52e+07 1.0 4.8e+01 7.9e+04 1.2e+01 5 16 2 22 2 5 16 2 22 2 68 +PCGAMG Opt l00 1 1.0 3.2562e-01 1.0 5.12e+06 1.0 2.4e+01 3.3e+04 1.0e+01 1 2 1 5 2 1 2 1 5 2 46 +PCGAMG Gal l01 1 1.0 5.5756e-01 1.0 2.09e+07 1.5 4.8e+01 4.5e+04 1.2e+01 2 8 2 13 2 2 8 2 13 2 97 +PCGAMG Opt l01 1 1.0 3.6571e-02 1.2 1.40e+06 1.4 2.4e+01 7.8e+03 1.0e+01 0 1 1 1 2 0 1 1 1 2 96 +PCSetUp 2 1.0 6.3911e+00 1.0 7.67e+07 1.0 8.0e+02 1.1e+04 5.0e+02 22 35 33 52 79 22 35 33 52 81 35 +PCSetUpOnBlocks 22 1.0 3.9115e-02 90.8 6.90e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 176 +PCApply 22 1.0 3.1825e+00 1.0 1.23e+08 1.1 1.4e+03 4.2e+03 6.0e+00 11 55 59 35 1 11 55 59 35 1 111 --- Event Stage 1: Unknown @@ -2227,9 +2270,9 @@ --- Event Stage 1: Unknown ======================================================================================================================== -Average time to get PetscTime(): 1.4e-07 -Average time for MPI_Barrier(): 4.0196e-06 -Average time for zero size MPI_Send(): 3.03967e-06 +Average time to get PetscTime(): 1.36e-07 +Average time for MPI_Barrier(): 4.8476e-06 +Average time for zero size MPI_Send(): 3.06e-06 #PETSc Option Table entries: --ndofs 10000 --problem_type elasticity @@ -2292,63 +2335,63 @@ Option left: name:--problem_type value: elasticity Option left: name:--scaling_type value: weak Option left: name:-mg_levels_esteig_ksp_type value: cg -2023-05-15 13:41:12.698 ( 12.700s) [RANK: 0 ] loguru.cpp:526 INFO| atexit +2023-05-16 15:54:37.831 ( 33.378s) [RANK: 0 ] loguru.cpp:526 INFO| atexit ==== elasticity strong scaling (3 processes with ndofs=30000) ==== -2023-05-15 13:41:12.984 ( 0.108s) [RANK: 0 ] utils.cpp:612 INFO| Compute partition of cells across ranks -2023-05-15 13:41:12.984 ( 0.108s) [RANK: 0 ] graphbuild.cpp:533 INFO| Building mesh dual graph -2023-05-15 13:41:12.984 ( 0.108s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph -2023-05-15 13:41:13.033 ( 0.157s) [RANK: 0 ] graphbuild.cpp:89 INFO| Build nonlocal part of mesh dual graph -2023-05-15 13:41:13.034 ( 0.158s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:13.034 ( 0.158s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:13.034 ( 0.158s) [RANK: 0 ] graphbuild.cpp:203 INFO| Number of destination and source ranks in non-local dual graph construction, and ratio to total number of ranks: 2, 2, 0.666667, 0.666667 -2023-05-15 13:41:13.039 ( 0.163s) [RANK: 0 ] graphbuild.cpp:545 INFO| Graph edges (local: 66332, non-local: 962) -2023-05-15 13:41:13.039 ( 0.163s) [RANK: 0 ] partitioners.cpp:316 INFO| Compute graph partition using PT-SCOTCH -2023-05-15 13:41:22.966 ( 10.090s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 -2023-05-15 13:41:22.991 ( 10.115s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 -2023-05-15 13:41:23.125 ( 10.249s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph -2023-05-15 13:41:23.212 ( 10.336s) [RANK: 0 ] ordering.cpp:202 INFO| GPS pseudo-diameter:(121) 15892-511 - -2023-05-15 13:41:23.222 ( 10.346s) [RANK: 0 ] Topology.cpp:923 INFO| Create topology -2023-05-15 13:41:23.226 ( 10.350s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 -2023-05-15 13:41:23.251 ( 10.375s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 -2023-05-15 13:41:23.290 ( 10.414s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.290 ( 10.415s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.291 ( 10.415s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.291 ( 10.415s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.298 ( 10.422s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.298 ( 10.422s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.299 ( 10.423s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:23.299 ( 10.423s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:23.323 ( 10.447s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.323 ( 10.448s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.332 ( 10.456s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:23.332 ( 10.456s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:23.332 ( 10.456s) [RANK: 0 ] MPI.h:368 INFO| Number of neighbourhood source ranks in distribute_to_postoffice: 0 -2023-05-15 13:41:23.333 ( 10.457s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.333 ( 10.457s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.333 ( 10.457s) [RANK: 0 ] MPI.h:500 INFO| Neighbourhood destination ranks from post office in distribute_data (rank, num dests, num dests/mpi_size): 0, 2, 0.666667 +2023-05-16 15:54:38.884 ( 0.548s) [RANK: 0 ] utils.cpp:612 INFO| Compute partition of cells across ranks +2023-05-16 15:54:38.884 ( 0.548s) [RANK: 0 ] graphbuild.cpp:533 INFO| Building mesh dual graph +2023-05-16 15:54:38.884 ( 0.548s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph +2023-05-16 15:54:39.040 ( 0.704s) [RANK: 0 ] graphbuild.cpp:89 INFO| Build nonlocal part of mesh dual graph +2023-05-16 15:54:39.040 ( 0.705s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:39.072 ( 0.737s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:39.073 ( 0.737s) [RANK: 0 ] graphbuild.cpp:203 INFO| Number of destination and source ranks in non-local dual graph construction, and ratio to total number of ranks: 2, 2, 0.666667, 0.666667 +2023-05-16 15:54:39.085 ( 0.749s) [RANK: 0 ] graphbuild.cpp:545 INFO| Graph edges (local: 66332, non-local: 962) +2023-05-16 15:54:39.085 ( 0.749s) [RANK: 0 ] partitioners.cpp:316 INFO| Compute graph partition using PT-SCOTCH +2023-05-16 15:54:52.092 ( 13.756s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 +2023-05-16 15:54:52.112 ( 13.777s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 +2023-05-16 15:54:52.410 ( 14.074s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph +2023-05-16 15:54:52.554 ( 14.218s) [RANK: 0 ] ordering.cpp:202 INFO| GPS pseudo-diameter:(120) 16494-1122 + +2023-05-16 15:54:52.566 ( 14.230s) [RANK: 0 ] Topology.cpp:923 INFO| Create topology +2023-05-16 15:54:52.584 ( 14.249s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 +2023-05-16 15:54:52.600 ( 14.265s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 +2023-05-16 15:54:52.767 ( 14.431s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:52.792 ( 14.457s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:52.797 ( 14.461s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:52.797 ( 14.461s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:52.800 ( 14.464s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:52.800 ( 14.465s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:52.809 ( 14.473s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:54:52.809 ( 14.473s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:54:52.809 ( 14.473s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:52.809 ( 14.473s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:52.825 ( 14.489s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:54:52.840 ( 14.505s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:54:52.841 ( 14.505s) [RANK: 0 ] MPI.h:368 INFO| Number of neighbourhood source ranks in distribute_to_postoffice: 0 UnitCube (24x19x19) to be refined 0 times -2023-05-15 13:41:23.360 ( 10.484s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 2 -2023-05-15 13:41:23.394 ( 10.518s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.395 ( 10.519s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.539 ( 10.663s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.539 ( 10.663s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.542 ( 10.666s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:41:23.542 ( 10.666s) [RANK: 0 ]topologycomputation.cpp:650 INFO| Computing mesh connectivity 2 - 3 from transpose. -2023-05-15 13:41:23.545 ( 10.669s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 0 -2023-05-15 13:41:23.549 ( 10.673s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.559 ( 10.683s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.559 ( 10.684s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.560 ( 10.684s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.560 ( 10.684s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:23.560 ( 10.684s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:23.560 ( 10.684s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:23.560 ( 10.684s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:23.562 ( 10.686s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 -2023-05-15 13:41:23.563 ( 10.687s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 -2023-05-15 13:41:23.563 ( 10.687s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 0 -2023-05-15 13:41:23.564 ( 10.688s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:41:23.641 ( 10.765s) [RANK: 0 ] SparsityPattern.cpp:389 INFO| Column ghost size increased from 214 to 561 +2023-05-16 15:54:52.845 ( 14.509s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:52.845 ( 14.509s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:52.845 ( 14.509s) [RANK: 0 ] MPI.h:500 INFO| Neighbourhood destination ranks from post office in distribute_data (rank, num dests, num dests/mpi_size): 0, 2, 0.666667 +2023-05-16 15:54:52.848 ( 14.512s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 2 +2023-05-16 15:54:52.885 ( 14.550s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:52.916 ( 14.581s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:53.177 ( 14.841s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:53.180 ( 14.845s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:53.183 ( 14.847s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:54:53.183 ( 14.847s) [RANK: 0 ]topologycomputation.cpp:650 INFO| Computing mesh connectivity 2 - 3 from transpose. +2023-05-16 15:54:53.194 ( 14.858s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 0 +2023-05-16 15:54:53.197 ( 14.862s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:53.221 ( 14.885s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:53.269 ( 14.933s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:53.269 ( 14.933s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:53.269 ( 14.933s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:54:53.269 ( 14.933s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:54:53.270 ( 14.934s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:54:53.270 ( 14.934s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:54:53.271 ( 14.935s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 +2023-05-16 15:54:53.272 ( 14.936s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 +2023-05-16 15:54:53.272 ( 14.936s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 0 +2023-05-16 15:54:53.272 ( 14.936s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:54:53.420 ( 15.084s) [RANK: 0 ] SparsityPattern.cpp:389 INFO| Column ghost size increased from 212 to 547 ---------------------------------------------------------------- Test problem summary @@ -2363,7 +2406,7 @@ Total degrees of freedom: 30000 (30 thousand) Average degrees of freedom per process: 10000 ---------------------------------------------------------------- -2023-05-15 13:41:24.274 ( 11.398s) [RANK: 0 ] petsc.cpp:677 INFO| PETSc Krylov solver starting to solve system. +2023-05-16 15:54:55.009 ( 16.673s) [RANK: 0 ] petsc.cpp:677 INFO| PETSc Krylov solver starting to solve system. KSP Object: 3 MPI processes type: cg maximum iterations=10000, initial guess is zero @@ -2381,7 +2424,7 @@ AGG specific options Number of levels to square graph 1 Number smoothing steps 1 - Complexity: grid = 1.0644 operator = 1.25169 + Complexity: grid = 1.0702 operator = 1.28848 Coarse grid solver -- level 0 ------------------------------- KSP Object: (mg_coarse_) 3 MPI processes type: preonly @@ -2406,33 +2449,33 @@ tolerance for zero pivot 2.22045e-14 using diagonal shift on blocks to prevent zero pivot [INBLOCKS] matrix ordering: nd - factor fill ratio given 5., needed 1.07148 + factor fill ratio given 5., needed 1.0454 Factored matrix follows: Mat Object: (mg_coarse_sub_) 1 MPI process type: seqaij - rows=246, cols=246, bs=6 + rows=252, cols=252, bs=6 package used to perform factorization: petsc - total: nonzeros=58284, allocated nonzeros=58284 - using I-node routines: found 59 nodes, limit used is 5 + total: nonzeros=61344, allocated nonzeros=61344 + using I-node routines: found 56 nodes, limit used is 5 linear system matrix = precond matrix: Mat Object: (mg_coarse_sub_) 1 MPI process type: seqaij - rows=246, cols=246, bs=6 - total: nonzeros=54396, allocated nonzeros=54396 + rows=252, cols=252, bs=6 + total: nonzeros=58680, allocated nonzeros=58680 total number of mallocs used during MatSetValues calls=0 - using I-node routines: found 73 nodes, limit used is 5 + using I-node routines: found 75 nodes, limit used is 5 linear system matrix = precond matrix: Mat Object: 3 MPI processes type: mpiaij - rows=246, cols=246, bs=6 - total: nonzeros=54396, allocated nonzeros=54396 + rows=252, cols=252, bs=6 + total: nonzeros=58680, allocated nonzeros=58680 total number of mallocs used during MatSetValues calls=0 - using I-node (on process 0) routines: found 73 nodes, limit used is 5 + using I-node (on process 0) routines: found 75 nodes, limit used is 5 Down solver (pre-smoother) on level 1 ------------------------------- KSP Object: (mg_levels_1_) 3 MPI processes type: chebyshev - eigenvalue targets used: min 0.250462, max 2.75509 - eigenvalues provided (min 1.74513e-06, max 2.50462) with transform: [0. 0.1; 0. 1.1] + eigenvalue targets used: min 0.233344, max 2.56678 + eigenvalues provided (min 9.43462e-07, max 2.33344) with transform: [0. 0.1; 0. 1.1] maximum iterations=2, nonzero initial guess tolerances: relative=1e-05, absolute=1e-50, divergence=10000. left preconditioning @@ -2443,17 +2486,17 @@ linear system matrix = precond matrix: Mat Object: 3 MPI processes type: mpiaij - rows=1686, cols=1686, bs=6 - total: nonzeros=260604, allocated nonzeros=260604 + rows=1854, cols=1854, bs=6 + total: nonzeros=302364, allocated nonzeros=302364 total number of mallocs used during MatSetValues calls=0 using scalable MatPtAP() implementation - using I-node (on process 0) routines: found 158 nodes, limit used is 5 + using I-node (on process 0) routines: found 192 nodes, limit used is 5 Up solver (post-smoother) same as down solver (pre-smoother) Down solver (pre-smoother) on level 2 ------------------------------- KSP Object: (mg_levels_2_) 3 MPI processes type: chebyshev - eigenvalue targets used: min 0.25856, max 2.84416 - eigenvalues provided (min 0.0750929, max 2.5856) with transform: [0. 0.1; 0. 1.1] + eigenvalue targets used: min 0.25831, max 2.84141 + eigenvalues provided (min 0.0734188, max 2.5831) with transform: [0. 0.1; 0. 1.1] maximum iterations=2, nonzero initial guess tolerances: relative=1e-05, absolute=1e-50, divergence=10000. left preconditioning @@ -2468,7 +2511,7 @@ total: nonzeros=1251522, allocated nonzeros=1251522 total number of mallocs used during MatSetValues calls=0 has attached near null space - using I-node (on process 0) routines: found 3370 nodes, limit used is 5 + using I-node (on process 0) routines: found 3349 nodes, limit used is 5 Up solver (post-smoother) same as down solver (pre-smoother) linear system matrix = precond matrix: Mat Object: 3 MPI processes @@ -2477,49 +2520,49 @@ total: nonzeros=1251522, allocated nonzeros=1251522 total number of mallocs used during MatSetValues calls=0 has attached near null space - using I-node (on process 0) routines: found 3370 nodes, limit used is 5 + using I-node (on process 0) routines: found 3349 nodes, limit used is 5 [MPI_MAX] Summary of timings | reps wall avg wall tot --------------------------------------------------------------------------------------------------------- -Build BoxMesh | 1 10.378391 10.378391 -Build dofmap data | 2 0.022703 0.045405 -Build sparsity | 1 0.022955 0.022955 -Compute connectivity 2-3 | 1 0.001109 0.001109 -Compute dof reordering map | 2 0.000376 0.000752 -Compute entities of dim = 2 | 1 0.182362 0.182362 -Compute graph partition (SCOTCH) | 1 9.910348 9.910348 -Compute local part of mesh dual graph | 2 0.064983 0.129966 -Compute local-to-local map | 1 0.004645 0.004645 -Compute non-local part of mesh dual graph | 1 0.007240 0.007240 -Compute-local-to-global links for global/local adjacency list | 1 0.000976 0.000976 -Distribute AdjacencyList nodes to destination ranks | 1 0.182308 0.182308 -Distribute row-wise data (scalable) | 1 0.001735 0.001735 -Extract partition boundaries from SCOTCH graph | 1 0.001229 0.001229 -GPS: create_level_structure | 2 0.002821 0.011284 -Get SCOTCH graph data | 1 0.000021 0.000021 -Gibbs-Poole-Stockmeyer ordering | 1 0.016073 0.016073 -Init MPI | 1 0.095859 0.095859 -Init PETSc | 1 0.008519 0.008519 -Init dofmap from element dofmap | 2 0.004718 0.009436 -Init logging | 1 0.000071 0.000071 -PETSc Krylov solver | 1 2.979508 2.979508 -SCOTCH: call SCOTCH_dgraphBuild | 1 0.000321 0.000321 -SCOTCH: call SCOTCH_dgraphHalo | 1 0.059910 0.059910 -SCOTCH: call SCOTCH_dgraphPart | 1 9.870127 9.870127 -SparsityPattern::assemble | 1 0.028076 0.028076 -Topology: create | 1 0.142568 0.142568 -Topology: determine shared index ownership | 1 0.091480 0.091480 -Topology: determine vertex ownership groups (owned, undetermined, unowned) | 1 0.007660 0.007660 -ZZZ Assemble matrix | 1 0.539294 0.539294 -ZZZ Assemble vector | 1 0.016013 0.016013 -ZZZ Create Mesh | 1 10.378955 10.378955 -ZZZ Create RHS function | 1 0.037099 0.037099 -ZZZ Create boundary conditions | 1 0.014307 0.014307 -ZZZ Create facets and facet->cell connectivity | 1 0.183592 0.183592 -ZZZ Create forms | 1 0.000129 0.000129 -ZZZ Create near-nullspace | 1 0.026588 0.026588 -ZZZ FunctionSpace | 1 0.018394 0.018394 -ZZZ Solve | 1 3.000090 3.000090 +Build BoxMesh | 1 13.970864 13.970864 +Build dofmap data | 2 0.047445 0.094889 +Build sparsity | 1 0.056576 0.056576 +Compute connectivity 2-3 | 1 0.001117 0.001117 +Compute dof reordering map | 2 0.000356 0.000712 +Compute entities of dim = 2 | 1 0.335146 0.335146 +Compute graph partition (SCOTCH) | 1 12.993136 12.993136 +Compute local part of mesh dual graph | 2 0.144397 0.288793 +Compute local-to-local map | 1 0.000522 0.000522 +Compute non-local part of mesh dual graph | 1 0.088810 0.088810 +Compute-local-to-global links for global/local adjacency list | 1 0.000964 0.000964 +Distribute AdjacencyList nodes to destination ranks | 1 0.342413 0.342413 +Distribute row-wise data (scalable) | 1 0.021215 0.021215 +Extract partition boundaries from SCOTCH graph | 1 0.001166 0.001166 +GPS: create_level_structure | 3 0.003394 0.011639 +Get SCOTCH graph data | 1 0.000017 0.000017 +Gibbs-Poole-Stockmeyer ordering | 1 0.032505 0.032505 +Init MPI | 1 0.596813 0.596813 +Init PETSc | 1 0.003049 0.003049 +Init dofmap from element dofmap | 2 0.006736 0.013472 +Init logging | 1 0.000076 0.000076 +PETSc Krylov solver | 1 10.117109 10.117109 +SCOTCH: call SCOTCH_dgraphBuild | 1 0.023315 0.023315 +SCOTCH: call SCOTCH_dgraphHalo | 1 0.087935 0.087935 +SCOTCH: call SCOTCH_dgraphPart | 1 12.930871 12.930871 +SparsityPattern::assemble | 1 0.056398 0.056398 +Topology: create | 1 0.246821 0.246821 +Topology: determine shared index ownership | 1 0.138803 0.138803 +Topology: determine vertex ownership groups (owned, undetermined, unowned) | 1 0.011678 0.011678 +ZZZ Assemble matrix | 1 0.705242 0.705242 +ZZZ Assemble vector | 1 0.036322 0.036322 +ZZZ Create Mesh | 1 13.971261 13.971261 +ZZZ Create RHS function | 1 0.055420 0.055420 +ZZZ Create boundary conditions | 1 0.010601 0.010601 +ZZZ Create facets and facet->cell connectivity | 1 0.336364 0.336364 +ZZZ Create forms | 1 0.000107 0.000107 +ZZZ Create near-nullspace | 1 0.652143 0.652143 +ZZZ FunctionSpace | 1 0.086574 0.086574 +ZZZ Solve | 1 10.293412 10.293412 *** Number of Krylov iterations: 21 *** Solution norm: 3.6795e-05 **************************************************************************************************************************************************************** @@ -2528,17 +2571,17 @@ ------------------------------------------------------------------ PETSc Performance Summary: ------------------------------------------------------------------ -/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/dolfinx-scaling-test on a named virt64c with 3 processors, by pbuilder1 Mon May 15 13:41:27 2023 +/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/dolfinx-scaling-test on a named i-capture-the-hostname with 3 processors, by pbuilder2 Tue May 16 15:55:05 2023 Using Petsc Release Version 3.18.5, Feb 27, 2023 Max Max/Min Avg Total -Time (sec): 1.428e+01 1.000 1.428e+01 +Time (sec): 2.627e+01 1.000 2.627e+01 Objects: 4.630e+02 1.004 4.617e+02 -Flops: 2.177e+08 1.077 2.080e+08 6.241e+08 -Flops/sec: 1.525e+07 1.077 1.456e+07 4.369e+07 -MPI Msg Count: 8.200e+02 1.041 7.987e+02 2.396e+03 -MPI Msg Len (bytes): 6.314e+06 1.387 6.894e+03 1.652e+07 -MPI Reductions: 6.370e+02 1.000 +Flops: 2.249e+08 1.081 2.165e+08 6.495e+08 +Flops/sec: 8.561e+06 1.081 8.240e+06 2.472e+07 +MPI Msg Count: 8.170e+02 1.044 7.947e+02 2.384e+03 +MPI Msg Len (bytes): 6.914e+06 1.484 7.102e+03 1.693e+07 +MPI Reductions: 6.360e+02 1.000 Flop counting convention: 1 flop = 1 real number operation of type (multiply/divide/add/subtract) e.g., VecAXPY() for real vectors of length N --> 2N flops @@ -2546,7 +2589,7 @@ Summary of Stages: ----- Time ------ ----- Flop ------ --- Messages --- -- Message Lengths -- -- Reductions -- Avg %Total Avg %Total Count %Total Avg %Total Count %Total - 0: Main Stage: 1.4282e+01 100.0% 6.2406e+08 100.0% 2.396e+03 100.0% 6.894e+03 100.0% 6.190e+02 97.2% + 0: Main Stage: 2.6274e+01 100.0% 6.4947e+08 100.0% 2.384e+03 100.0% 7.102e+03 100.0% 6.180e+02 97.2% ------------------------------------------------------------------------------------------------------------------------ See the 'Profiling' chapter of the users' manual for details on interpreting output. @@ -2570,79 +2613,79 @@ --- Event Stage 0: Main Stage -BuildTwoSided 103 1.0 3.9985e-01 2.0 0.00e+00 0.0 1.4e+02 4.0e+00 1.0e+02 2 0 6 0 16 2 0 6 0 17 0 -BuildTwoSidedF 86 1.0 3.6660e-01 2.2 0.00e+00 0.0 1.2e+02 3.5e+04 8.6e+01 2 0 5 25 14 2 0 5 25 14 0 -MatMult 217 1.0 8.6624e-01 1.1 1.21e+08 1.1 1.3e+03 5.4e+03 2.0e+00 6 55 55 43 0 6 55 55 43 0 399 -MatMultAdd 44 1.0 1.6751e-01 1.3 1.02e+07 1.1 1.8e+02 1.4e+03 0.0e+00 1 5 7 1 0 1 5 7 1 0 174 -MatMultTranspose 44 1.0 1.0524e-01 1.1 1.02e+07 1.1 1.9e+02 1.3e+03 2.0e+00 1 5 8 1 0 1 5 8 1 0 277 -MatSolve 22 0.0 3.4467e-03 0.0 2.56e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 742 -MatLUFactorSym 1 1.0 3.9829e-03 127.4 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatLUFactorNum 1 1.0 1.3976e-02 4063.8 8.67e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 620 -MatConvert 1 1.0 3.4387e-02 1.5 0.00e+00 0.0 1.2e+01 7.1e+02 1.0e+00 0 0 1 0 0 0 0 1 0 0 0 -MatScale 4 1.0 1.4577e-03 1.1 4.61e+05 1.1 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 908 -MatResidual 44 1.0 1.6782e-01 1.1 2.34e+07 1.1 2.6e+02 5.1e+03 0.0e+00 1 11 11 8 0 1 11 11 8 0 396 -MatAssemblyBegin 59 1.0 4.3112e-01 2.0 0.00e+00 0.0 1.2e+02 3.5e+04 3.0e+01 2 0 5 25 5 2 0 5 25 5 0 -MatAssemblyEnd 59 1.0 2.1949e-01 1.1 8.07e+04 1.6 0.0e+00 0.0e+00 9.6e+01 1 0 0 0 15 1 0 0 0 16 1 -MatGetRowIJ 1 0.0 1.4657e-04 0.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatCreateSubMat 2 1.0 2.7110e-02 1.0 0.00e+00 0.0 1.0e+01 4.4e+04 2.8e+01 0 0 0 3 4 0 0 0 3 5 0 -MatGetOrdering 1 0.0 3.3205e-04 0.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatCoarsen 2 1.0 1.9495e-01 1.0 1.38e+05 1.0 2.4e+02 7.2e+02 9.7e+01 1 0 10 1 15 1 0 10 1 16 2 -MatZeroEntries 3 1.0 4.5762e-03 21.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatView 6 1.5 1.8845e-03 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 4.0e+00 0 0 0 0 1 0 0 0 0 1 0 -MatAXPY 4 1.0 9.2435e-02 1.1 1.14e+05 1.0 0.0e+00 0.0e+00 1.2e+01 1 0 0 0 2 1 0 0 0 2 4 -MatTranspose 10 1.0 2.6795e-02 1.0 0.00e+00 0.0 9.0e+01 2.0e+03 3.2e+01 0 0 4 1 5 0 0 4 1 5 0 -MatMatMultSym 9 1.0 1.6998e-01 1.4 0.00e+00 0.0 5.1e+01 1.1e+04 2.8e+01 1 0 2 4 4 1 0 2 4 5 0 -MatMatMultNum 3 1.0 5.6207e-02 1.0 6.39e+06 1.1 1.5e+01 2.5e+04 3.0e+00 0 3 1 2 0 0 3 1 2 0 323 -MatPtAPSymbolic 3 1.0 5.1443e-01 1.0 0.00e+00 0.0 9.9e+01 3.2e+04 2.1e+01 4 0 4 19 3 4 0 4 19 3 0 -MatPtAPNumeric 3 1.0 6.1132e-01 1.0 5.69e+07 1.3 3.0e+01 8.4e+04 1.5e+01 4 24 1 15 2 4 24 1 15 2 248 -MatGetLocalMat 9 1.0 5.6102e-03 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatGetBrAoCol 9 1.0 2.6462e-02 1.2 0.00e+00 0.0 1.2e+02 2.9e+04 1.0e+00 0 0 5 21 0 0 0 5 21 0 0 -VecMDot 20 1.0 7.1269e-02 3.8 1.18e+06 1.0 0.0e+00 0.0e+00 2.0e+01 0 1 0 0 3 0 1 0 0 3 49 -VecTDot 42 1.0 7.5054e-02 1.5 8.49e+05 1.0 0.0e+00 0.0e+00 4.2e+01 0 0 0 0 7 0 0 0 0 7 34 -VecNorm 44 1.0 1.2638e-01 3.6 6.80e+05 1.0 0.0e+00 0.0e+00 4.4e+01 0 0 0 0 7 0 0 0 0 7 16 -VecScale 22 1.0 2.1404e-04 1.3 1.18e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 1628 -VecCopy 136 1.0 1.2017e-03 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecSet 203 1.0 2.3094e-03 3.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecAXPY 44 1.0 6.0182e-03 3.5 8.70e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 429 -VecAYPX 284 1.0 1.4465e-02 2.4 2.30e+06 1.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 468 -VecAXPBYCZ 88 1.0 3.5598e-03 1.2 2.37e+06 1.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 1958 -VecMAXPY 22 1.0 2.2159e-03 1.1 1.40e+06 1.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 1859 -VecAssemblyBegin 57 1.0 9.8881e-03 5.5 0.00e+00 0.0 0.0e+00 0.0e+00 5.6e+01 0 0 0 0 9 0 0 0 0 9 0 -VecAssemblyEnd 57 1.0 1.9049e-04 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecPointwiseMult 198 1.0 5.2705e-03 1.2 1.06e+06 1.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 595 -VecScatterBegin 363 1.0 1.2860e-02 1.5 0.00e+00 0.0 1.9e+03 4.1e+03 8.0e+00 0 0 79 47 1 0 0 79 47 1 0 -VecScatterEnd 363 1.0 6.9555e-01 1.2 1.43e+04 2.1 0.0e+00 0.0e+00 0.0e+00 4 0 0 0 0 4 0 0 0 0 0 -VecNormalize 22 1.0 4.9217e-02 56.0 3.55e+05 1.0 0.0e+00 0.0e+00 2.2e+01 0 0 0 0 3 0 0 0 0 4 21 -SFSetGraph 35 1.0 3.5590e-04 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFSetUp 17 1.0 5.0971e-02 1.3 0.00e+00 0.0 1.6e+02 4.8e+02 1.7e+01 0 0 7 0 3 0 0 7 0 3 0 -SFBcastBegin 15 1.0 2.9154e-04 1.2 0.00e+00 0.0 9.0e+01 6.3e+02 0.0e+00 0 0 4 0 0 0 0 4 0 0 0 -SFBcastEnd 15 1.0 4.2819e-02 1.8 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFReduceBegin 4 1.0 1.2283e-04 1.1 0.00e+00 0.0 1.8e+01 5.4e+02 0.0e+00 0 0 1 0 0 0 0 1 0 0 0 -SFReduceEnd 4 1.0 5.1115e-05 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFPack 382 1.0 3.0137e-03 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFUnpack 382 1.0 7.5822e-04 1.1 1.43e+04 2.1 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 39 -KSPSetUp 7 1.0 5.3617e-04 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 4.0e+00 0 0 0 0 1 0 0 0 0 1 0 -KSPSolve 1 1.0 1.1231e+00 1.0 1.38e+08 1.1 1.6e+03 4.5e+03 7.0e+01 8 65 65 42 11 8 65 65 42 11 363 -KSPGMRESOrthog 20 1.0 7.3392e-02 3.6 2.37e+06 1.0 0.0e+00 0.0e+00 2.0e+01 0 1 0 0 3 0 1 0 0 3 95 -PCSetUp_GAMG+ 1 1.0 1.8483e+00 1.0 7.75e+07 1.3 8.0e+02 1.0e+04 5.0e+02 13 34 33 51 79 13 34 33 51 81 114 - PCGAMGCreateG 2 1.0 1.3524e-01 1.1 4.98e+04 1.0 6.0e+01 2.8e+03 4.4e+01 1 0 3 1 7 1 0 3 1 7 1 - GAMG Coarsen 2 1.0 1.9704e-01 1.0 1.38e+05 1.0 2.4e+02 7.2e+02 9.7e+01 1 0 10 1 15 1 0 10 1 16 2 - GAMG MIS/Agg 2 1.0 1.9500e-01 1.0 1.38e+05 1.0 2.4e+02 7.2e+02 9.7e+01 1 0 10 1 15 1 0 10 1 16 2 - PCGAMGProl 2 1.0 5.4778e-02 1.0 0.00e+00 0.0 1.9e+02 1.7e+03 1.9e+02 0 0 8 2 30 0 0 8 2 30 0 - GAMG Prol-col 2 1.0 2.2614e-02 1.0 0.00e+00 0.0 1.8e+02 6.3e+02 1.7e+02 0 0 8 1 27 0 0 8 1 27 0 - GAMG Prol-lift 2 1.0 3.1533e-02 1.0 0.00e+00 0.0 1.2e+01 1.7e+04 1.0e+01 0 0 1 1 2 0 0 1 1 2 0 - PCGAMGOptProl 2 1.0 3.3950e-01 1.0 2.05e+07 1.1 1.9e+02 8.3e+03 8.2e+01 2 9 8 10 13 2 9 8 10 13 173 - GAMG smooth 2 1.0 1.5932e-01 1.0 6.91e+06 1.1 4.8e+01 2.0e+04 2.6e+01 1 3 2 6 4 1 3 2 6 4 123 - PCGAMGCreateL 2 1.0 1.1275e+00 1.0 5.68e+07 1.3 1.2e+02 5.1e+04 7.7e+01 8 24 5 37 12 8 24 5 37 12 134 - GAMG PtAP 2 1.0 1.0987e+00 1.0 5.68e+07 1.3 9.6e+01 5.9e+04 2.4e+01 8 24 4 34 4 8 24 4 34 4 138 - GAMG Reduce 1 1.0 2.9588e-02 1.0 0.00e+00 0.0 2.5e+01 1.9e+04 5.3e+01 0 0 1 3 8 0 0 1 3 9 0 -PCGAMG Gal l00 1 1.0 8.0729e-01 1.0 3.49e+07 1.1 4.8e+01 7.4e+04 1.2e+01 6 16 2 21 2 6 16 2 21 2 125 -PCGAMG Opt l00 1 1.0 1.0628e-01 1.1 5.04e+06 1.0 2.4e+01 3.3e+04 1.0e+01 1 2 1 5 2 1 2 1 5 2 141 -PCGAMG Gal l01 1 1.0 2.9138e-01 1.0 2.19e+07 1.9 4.8e+01 4.4e+04 1.2e+01 2 8 2 13 2 2 8 2 13 2 174 -PCGAMG Opt l01 1 1.0 2.8385e-02 1.0 1.34e+06 1.8 2.4e+01 6.8e+03 1.0e+01 0 1 1 1 2 0 1 1 1 2 110 -PCSetUp 2 1.0 1.8667e+00 1.0 7.75e+07 1.1 8.0e+02 1.0e+04 5.0e+02 13 35 33 51 79 13 35 33 51 81 117 -PCSetUpOnBlocks 22 1.0 1.8603e-02 49.1 8.67e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 466 -PCApply 22 1.0 9.1400e-01 1.1 1.19e+08 1.1 1.4e+03 4.1e+03 6.0e+00 6 56 59 36 1 6 56 59 36 1 381 +BuildTwoSided 103 1.0 1.5237e+00 2.6 0.00e+00 0.0 1.4e+02 4.0e+00 1.0e+02 4 0 6 0 16 4 0 6 0 17 0 +BuildTwoSidedF 86 1.0 1.2299e+00 3.6 0.00e+00 0.0 1.1e+02 3.7e+04 8.6e+01 3 0 5 25 14 3 0 5 25 14 0 +MatMult 217 1.0 2.4983e+00 1.1 1.22e+08 1.1 1.3e+03 5.5e+03 2.0e+00 9 54 56 43 0 9 54 56 43 0 141 +MatMultAdd 44 1.0 3.4937e-01 1.2 1.04e+07 1.0 1.8e+02 1.3e+03 0.0e+00 1 5 7 1 0 1 5 7 1 0 87 +MatMultTranspose 44 1.0 3.9131e-01 1.2 1.04e+07 1.0 1.9e+02 1.2e+03 2.0e+00 1 5 8 1 0 1 5 8 1 0 78 +MatSolve 22 0.0 3.2913e-03 0.0 2.69e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 818 +MatLUFactorSym 1 1.0 1.2511e-02 385.9 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatLUFactorNum 1 1.0 5.9309e-02 13482.3 9.06e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 153 +MatConvert 1 1.0 2.2297e-02 1.7 0.00e+00 0.0 1.2e+01 7.1e+02 1.0e+00 0 0 1 0 0 0 0 1 0 0 0 +MatScale 4 1.0 1.2280e-03 1.1 4.70e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 1122 +MatResidual 44 1.0 5.8201e-01 1.2 2.38e+07 1.1 2.6e+02 5.2e+03 0.0e+00 2 11 11 8 0 2 11 11 8 0 117 +MatAssemblyBegin 59 1.0 1.0557e+00 3.1 0.00e+00 0.0 1.1e+02 3.7e+04 3.0e+01 3 0 5 25 5 3 0 5 25 5 0 +MatAssemblyEnd 59 1.0 1.2311e+00 1.1 8.82e+04 1.9 0.0e+00 0.0e+00 9.6e+01 4 0 0 0 15 4 0 0 0 16 0 +MatGetRowIJ 1 0.0 1.4231e-04 0.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatCreateSubMat 2 1.0 4.9588e-01 1.0 0.00e+00 0.0 1.0e+01 5.1e+04 2.8e+01 2 0 0 3 4 2 0 0 3 5 0 +MatGetOrdering 1 0.0 3.2379e-04 0.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatCoarsen 2 1.0 1.4175e+00 1.0 1.38e+05 1.0 2.3e+02 7.6e+02 9.6e+01 5 0 10 1 15 5 0 10 1 16 0 +MatZeroEntries 3 1.0 2.6737e-04 1.4 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatView 6 1.5 1.3763e-02 1.5 0.00e+00 0.0 0.0e+00 0.0e+00 4.0e+00 0 0 0 0 1 0 0 0 0 1 0 +MatAXPY 4 1.0 1.6374e-01 1.1 1.13e+05 1.0 0.0e+00 0.0e+00 1.2e+01 1 0 0 0 2 1 0 0 0 2 2 +MatTranspose 10 1.0 4.2431e-01 1.0 0.00e+00 0.0 9.0e+01 2.1e+03 3.2e+01 2 0 4 1 5 2 0 4 1 5 0 +MatMatMultSym 9 1.0 4.7878e-01 1.0 0.00e+00 0.0 5.1e+01 1.2e+04 2.8e+01 2 0 2 4 4 2 0 2 4 5 0 +MatMatMultNum 3 1.0 9.8035e-02 1.1 6.49e+06 1.1 1.5e+01 2.5e+04 3.0e+00 0 3 1 2 0 0 3 1 2 0 190 +MatPtAPSymbolic 3 1.0 1.1839e+00 1.0 0.00e+00 0.0 9.9e+01 3.3e+04 2.1e+01 4 0 4 19 3 4 0 4 19 3 0 +MatPtAPNumeric 3 1.0 1.3949e+00 1.0 6.24e+07 1.2 3.0e+01 8.6e+04 1.5e+01 5 25 1 15 2 5 25 1 15 2 118 +MatGetLocalMat 9 1.0 1.4684e-02 1.5 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatGetBrAoCol 9 1.0 3.2514e-01 1.6 0.00e+00 0.0 1.2e+02 3.0e+04 1.0e+00 1 0 5 21 0 1 0 5 21 0 0 +VecMDot 20 1.0 9.1244e-02 2.1 1.18e+06 1.0 0.0e+00 0.0e+00 2.0e+01 0 1 0 0 3 0 1 0 0 3 38 +VecTDot 42 1.0 1.8788e-01 1.6 8.50e+05 1.0 0.0e+00 0.0e+00 4.2e+01 1 0 0 0 7 1 0 0 0 7 13 +VecNorm 44 1.0 2.2618e-01 1.8 6.80e+05 1.0 0.0e+00 0.0e+00 4.4e+01 1 0 0 0 7 1 0 0 0 7 9 +VecScale 22 1.0 2.0722e-04 1.1 1.18e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 1691 +VecCopy 136 1.0 1.0528e-03 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecSet 203 1.0 7.8103e-04 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecAXPY 44 1.0 1.5379e-03 1.1 8.71e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 1680 +VecAYPX 284 1.0 2.7035e-02 5.1 2.29e+06 1.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 252 +VecAXPBYCZ 88 1.0 3.7038e-03 1.4 2.35e+06 1.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 1892 +VecMAXPY 22 1.0 1.9853e-03 1.1 1.39e+06 1.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 2086 +VecAssemblyBegin 57 1.0 2.9757e-01 3.5 0.00e+00 0.0 0.0e+00 0.0e+00 5.6e+01 1 0 0 0 9 1 0 0 0 9 0 +VecAssemblyEnd 57 1.0 2.6269e-04 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecPointwiseMult 198 1.0 1.2385e-02 1.5 1.06e+06 1.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 255 +VecScatterBegin 363 1.0 1.7374e-01 1.3 0.00e+00 0.0 1.9e+03 4.1e+03 8.0e+00 1 0 80 47 1 1 0 80 47 1 0 +VecScatterEnd 363 1.0 2.7014e+00 1.0 1.40e+04 2.4 0.0e+00 0.0e+00 0.0e+00 10 0 0 0 0 10 0 0 0 0 0 +VecNormalize 22 1.0 6.2398e-02 1.1 3.53e+05 1.0 0.0e+00 0.0e+00 2.2e+01 0 0 0 0 3 0 0 0 0 4 17 +SFSetGraph 35 1.0 3.8984e-04 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFSetUp 17 1.0 3.7349e-01 1.3 0.00e+00 0.0 1.6e+02 4.9e+02 1.7e+01 1 0 7 0 3 1 0 7 0 3 0 +SFBcastBegin 14 1.0 3.7822e-04 1.2 0.00e+00 0.0 8.4e+01 6.7e+02 0.0e+00 0 0 4 0 0 0 0 4 0 0 0 +SFBcastEnd 14 1.0 1.7891e-01 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 1 0 0 0 0 1 0 0 0 0 0 +SFReduceBegin 4 1.0 1.9504e-04 1.6 0.00e+00 0.0 1.8e+01 5.4e+02 0.0e+00 0 0 1 0 0 0 0 1 0 0 0 +SFReduceEnd 4 1.0 4.6056e-02 3.9 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFPack 381 1.0 1.0744e-02 4.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFUnpack 381 1.0 5.1630e-03 4.2 1.40e+04 2.4 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 6 +KSPSetUp 7 1.0 4.8489e-02 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 4.0e+00 0 0 0 0 1 0 0 0 0 1 0 +KSPSolve 1 1.0 3.3142e+00 1.0 1.44e+08 1.1 1.6e+03 4.6e+03 7.0e+01 13 64 65 42 11 13 64 65 42 11 126 +KSPGMRESOrthog 20 1.0 9.3153e-02 2.1 2.35e+06 1.0 0.0e+00 0.0e+00 2.0e+01 0 1 0 0 3 0 1 0 0 3 75 +PCSetUp_GAMG+ 1 1.0 6.7838e+00 1.0 8.32e+07 1.2 8.0e+02 1.1e+04 5.0e+02 26 35 33 51 79 26 35 33 51 81 33 + PCGAMGCreateG 2 1.0 4.9234e-01 1.0 4.97e+04 1.0 6.0e+01 2.9e+03 4.4e+01 2 0 3 1 7 2 0 3 1 7 0 + GAMG Coarsen 2 1.0 1.4198e+00 1.0 1.38e+05 1.0 2.3e+02 7.6e+02 9.6e+01 5 0 10 1 15 5 0 10 1 16 0 + GAMG MIS/Agg 2 1.0 1.4176e+00 1.0 1.38e+05 1.0 2.3e+02 7.6e+02 9.6e+01 5 0 10 1 15 5 0 10 1 16 0 + PCGAMGProl 2 1.0 9.6101e-01 1.0 0.00e+00 0.0 1.9e+02 1.9e+03 1.9e+02 4 0 8 2 30 4 0 8 2 30 0 + GAMG Prol-col 2 1.0 8.0465e-01 1.0 0.00e+00 0.0 1.8e+02 7.2e+02 1.7e+02 3 0 8 1 27 3 0 8 1 28 0 + GAMG Prol-lift 2 1.0 7.6113e-02 1.0 0.00e+00 0.0 1.2e+01 2.0e+04 1.0e+01 0 0 1 1 2 0 0 1 1 2 0 + PCGAMGOptProl 2 1.0 6.8568e-01 1.0 2.07e+07 1.1 1.9e+02 8.5e+03 8.2e+01 3 9 8 10 13 3 9 8 10 13 88 + GAMG smooth 2 1.0 3.5211e-01 1.0 7.02e+06 1.1 4.8e+01 2.0e+04 2.6e+01 1 3 2 6 4 1 3 2 6 4 57 + PCGAMGCreateL 2 1.0 3.1199e+00 1.0 6.23e+07 1.2 1.2e+02 5.2e+04 7.7e+01 12 25 5 37 12 12 25 5 37 12 53 + GAMG PtAP 2 1.0 2.3129e+00 1.0 6.23e+07 1.2 9.6e+01 6.0e+04 2.4e+01 9 25 4 34 4 9 25 4 34 4 71 + GAMG Reduce 1 1.0 8.0765e-01 1.0 0.00e+00 0.0 2.5e+01 2.1e+04 5.3e+01 3 0 1 3 8 3 0 1 3 9 0 +PCGAMG Gal l00 1 1.0 1.3827e+00 1.0 3.57e+07 1.0 4.8e+01 7.3e+04 1.2e+01 5 16 2 21 2 5 16 2 21 2 77 +PCGAMG Opt l00 1 1.0 2.2547e-01 1.0 5.06e+06 1.0 2.4e+01 3.3e+04 1.0e+01 1 2 1 5 2 1 2 1 5 2 67 +PCGAMG Gal l01 1 1.0 9.3344e-01 1.0 2.66e+07 1.7 4.8e+01 4.8e+04 1.2e+01 4 9 2 13 2 4 9 2 13 2 63 +PCGAMG Opt l01 1 1.0 6.0880e-02 1.0 1.50e+06 1.4 2.4e+01 7.4e+03 1.0e+01 0 1 1 1 2 0 1 1 1 2 60 +PCSetUp 2 1.0 6.8562e+00 1.0 8.32e+07 1.2 8.0e+02 1.1e+04 5.0e+02 26 36 33 51 79 26 36 33 51 81 34 +PCSetUpOnBlocks 22 1.0 7.2483e-02 194.9 9.06e+06 0.0 0.0e+00 0.0e+00 0.0e+00 0 1 0 0 0 0 1 0 0 0 125 +PCApply 22 1.0 2.8046e+00 1.0 1.24e+08 1.1 1.4e+03 4.2e+03 6.0e+00 10 55 60 35 1 10 55 60 35 1 128 --- Event Stage 1: Unknown @@ -2671,9 +2714,9 @@ --- Event Stage 1: Unknown ======================================================================================================================== -Average time to get PetscTime(): 1.22e-07 -Average time for MPI_Barrier(): 3.3916e-06 -Average time for zero size MPI_Send(): 3.113e-06 +Average time to get PetscTime(): 1.46e-07 +Average time for MPI_Barrier(): 4.2876e-06 +Average time for zero size MPI_Send(): 2.693e-06 #PETSc Option Table entries: --ndofs 30000 --problem_type elasticity @@ -2736,67 +2779,67 @@ Option left: name:--problem_type value: elasticity Option left: name:--scaling_type value: strong Option left: name:-mg_levels_esteig_ksp_type value: cg -2023-05-15 13:41:27.353 ( 14.477s) [RANK: 0 ] loguru.cpp:526 INFO| atexit +2023-05-16 15:55:05.494 ( 27.158s) [RANK: 0 ] loguru.cpp:526 INFO| atexit ==== poisson weak scaling (3 processes with ndofs=10000) ==== -2023-05-15 13:41:27.792 ( 0.220s) [RANK: 0 ] utils.cpp:612 INFO| Compute partition of cells across ranks -2023-05-15 13:41:27.793 ( 0.221s) [RANK: 0 ] graphbuild.cpp:533 INFO| Building mesh dual graph -2023-05-15 13:41:27.793 ( 0.221s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph -2023-05-15 13:41:27.994 ( 0.422s) [RANK: 0 ] graphbuild.cpp:89 INFO| Build nonlocal part of mesh dual graph -2023-05-15 13:41:28.013 ( 0.441s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:28.014 ( 0.442s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:28.014 ( 0.442s) [RANK: 0 ] graphbuild.cpp:203 INFO| Number of destination and source ranks in non-local dual graph construction, and ratio to total number of ranks: 2, 2, 0.666667, 0.666667 -2023-05-15 13:41:28.027 ( 0.455s) [RANK: 0 ] graphbuild.cpp:545 INFO| Graph edges (local: 210000, non-local: 1800) -2023-05-15 13:41:28.027 ( 0.455s) [RANK: 0 ] partitioners.cpp:316 INFO| Compute graph partition using PT-SCOTCH -2023-05-15 13:41:45.982 ( 18.410s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 -2023-05-15 13:41:45.982 ( 18.410s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 -2023-05-15 13:41:45.994 ( 18.422s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph -2023-05-15 13:41:46.168 ( 18.596s) [RANK: 0 ] ordering.cpp:202 INFO| GPS pseudo-diameter:(167) 1635-51451 - -2023-05-15 13:41:46.192 ( 18.620s) [RANK: 0 ] Topology.cpp:923 INFO| Create topology -2023-05-15 13:41:46.204 ( 18.632s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 -2023-05-15 13:41:46.204 ( 18.632s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 -2023-05-15 13:41:46.258 ( 18.686s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.260 ( 18.688s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.260 ( 18.688s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.261 ( 18.689s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.271 ( 18.699s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.271 ( 18.699s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.272 ( 18.699s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:46.272 ( 18.700s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:46.272 ( 18.700s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.272 ( 18.700s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.285 ( 18.713s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:46.285 ( 18.713s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:46.285 ( 18.713s) [RANK: 0 ] MPI.h:368 INFO| Number of neighbourhood source ranks in distribute_to_postoffice: 0 -2023-05-15 13:41:46.286 ( 18.714s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.286 ( 18.714s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.286 ( 18.714s) [RANK: 0 ] MPI.h:500 INFO| Neighbourhood destination ranks from post office in distribute_data (rank, num dests, num dests/mpi_size): 0, 2, 0.666667 -2023-05-15 13:41:46.295 ( 18.723s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 2 +2023-05-16 15:55:06.490 ( 0.560s) [RANK: 0 ] utils.cpp:612 INFO| Compute partition of cells across ranks +2023-05-16 15:55:06.490 ( 0.561s) [RANK: 0 ] graphbuild.cpp:533 INFO| Building mesh dual graph +2023-05-16 15:55:06.490 ( 0.561s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph +2023-05-16 15:55:06.855 ( 0.925s) [RANK: 0 ] graphbuild.cpp:89 INFO| Build nonlocal part of mesh dual graph +2023-05-16 15:55:07.017 ( 1.088s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:07.037 ( 1.108s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:07.037 ( 1.108s) [RANK: 0 ] graphbuild.cpp:203 INFO| Number of destination and source ranks in non-local dual graph construction, and ratio to total number of ranks: 2, 2, 0.666667, 0.666667 +2023-05-16 15:55:07.142 ( 1.213s) [RANK: 0 ] graphbuild.cpp:545 INFO| Graph edges (local: 210000, non-local: 1800) +2023-05-16 15:55:07.142 ( 1.213s) [RANK: 0 ] partitioners.cpp:316 INFO| Compute graph partition using PT-SCOTCH +2023-05-16 15:55:29.393 ( 23.464s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 +2023-05-16 15:55:29.416 ( 23.487s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 +2023-05-16 15:55:29.855 ( 23.926s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph +2023-05-16 15:55:30.273 ( 24.344s) [RANK: 0 ] ordering.cpp:202 INFO| GPS pseudo-diameter:(168) 1473-51353 + +2023-05-16 15:55:30.340 ( 24.410s) [RANK: 0 ] Topology.cpp:923 INFO| Create topology +2023-05-16 15:55:30.371 ( 24.442s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 +2023-05-16 15:55:30.397 ( 24.468s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 +2023-05-16 15:55:30.818 ( 24.889s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:30.829 ( 24.900s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:30.873 ( 24.943s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:30.896 ( 24.967s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:30.983 ( 25.053s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:31.016 ( 25.087s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:31.076 ( 25.147s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:55:31.089 ( 25.160s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:55:31.197 ( 25.267s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:31.220 ( 25.291s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:31.285 ( 25.355s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:55:31.293 ( 25.364s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:55:31.293 ( 25.364s) [RANK: 0 ] MPI.h:368 INFO| Number of neighbourhood source ranks in distribute_to_postoffice: 0 +2023-05-16 15:55:31.318 ( 25.389s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:31.332 ( 25.403s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:31.333 ( 25.403s) [RANK: 0 ] MPI.h:500 INFO| Neighbourhood destination ranks from post office in distribute_data (rank, num dests, num dests/mpi_size): 0, 2, 0.666667 UnitCube (30x30x30) to be refined 0 times -2023-05-15 13:41:46.354 ( 18.782s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.358 ( 18.786s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.505 ( 18.932s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.505 ( 18.933s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.512 ( 18.940s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:41:46.512 ( 18.940s) [RANK: 0 ]topologycomputation.cpp:650 INFO| Computing mesh connectivity 2 - 3 from transpose. -2023-05-15 13:41:46.517 ( 18.945s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 0 -2023-05-15 13:41:46.527 ( 18.955s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.528 ( 18.956s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.528 ( 18.956s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.528 ( 18.956s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.528 ( 18.956s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:41:46.528 ( 18.956s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:41:46.529 ( 18.957s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.529 ( 18.957s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.532 ( 18.960s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 -2023-05-15 13:41:46.534 ( 18.962s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 -2023-05-15 13:41:46.535 ( 18.962s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 0 -2023-05-15 13:41:46.536 ( 18.964s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:41:46.619 ( 19.047s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:41:46.619 ( 19.047s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 2 -2023-05-15 13:41:46.619 ( 19.047s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:46.620 ( 19.048s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:46.683 ( 19.111s) [RANK: 0 ] SparsityPattern.cpp:389 INFO| Column ghost size increased from 469 to 1274 +2023-05-16 15:55:31.526 ( 25.597s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 2 +2023-05-16 15:55:31.663 ( 25.733s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:31.672 ( 25.743s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:32.157 ( 26.227s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:32.180 ( 26.251s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:32.244 ( 26.315s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:55:32.247 ( 26.317s) [RANK: 0 ]topologycomputation.cpp:650 INFO| Computing mesh connectivity 2 - 3 from transpose. +2023-05-16 15:55:32.252 ( 26.322s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 0 +2023-05-16 15:55:32.280 ( 26.351s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:32.301 ( 26.372s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:32.349 ( 26.420s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:32.368 ( 26.439s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:32.409 ( 26.479s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:55:32.437 ( 26.508s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:55:32.565 ( 26.636s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:32.589 ( 26.660s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:32.713 ( 26.784s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 +2023-05-16 15:55:32.716 ( 26.786s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 +2023-05-16 15:55:32.716 ( 26.786s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 0 +2023-05-16 15:55:32.718 ( 26.789s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:55:33.179 ( 27.250s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:55:33.179 ( 27.250s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 2 +2023-05-16 15:55:33.179 ( 27.250s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:33.272 ( 27.343s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:33.458 ( 27.529s) [RANK: 0 ] SparsityPattern.cpp:389 INFO| Column ghost size increased from 469 to 1274 ---------------------------------------------------------------- Test problem summary @@ -2811,7 +2854,7 @@ Total degrees of freedom: 29791 (29.8 thousand) Average degrees of freedom per process: 9930 ---------------------------------------------------------------- -2023-05-15 13:41:46.859 ( 19.287s) [RANK: 0 ] petsc.cpp:677 INFO| PETSc Krylov solver starting to solve system. +2023-05-16 15:55:33.910 ( 27.980s) [RANK: 0 ] petsc.cpp:677 INFO| PETSc Krylov solver starting to solve system. KSP Object: 3 MPI processes type: cg maximum iterations=10000, initial guess is zero @@ -2855,44 +2898,44 @@ [MPI_MAX] Summary of timings | reps wall avg wall tot --------------------------------------------------------------------------------------------------------- -Build BoxMesh | 1 18.534523 18.534523 -Build dofmap data | 2 0.013436 0.026872 -Build sparsity | 1 0.023999 0.023999 -Compute connectivity 2-3 | 1 0.004748 0.004748 -Compute dof reordering map | 2 0.001238 0.002477 -Compute entities of dim = 2 | 1 0.217239 0.217239 -Compute graph partition (SCOTCH) | 1 17.942604 17.942604 -Compute local part of mesh dual graph | 2 0.193003 0.386006 -Compute local-to-local map | 1 0.002315 0.002315 -Compute non-local part of mesh dual graph | 1 0.079041 0.079041 -Compute-local-to-global links for global/local adjacency list | 1 0.003275 0.003275 -Distribute AdjacencyList nodes to destination ranks | 1 0.023941 0.023941 -Distribute row-wise data (scalable) | 1 0.003205 0.003205 -Extract partition boundaries from SCOTCH graph | 1 0.003051 0.003051 -GPS: create_level_structure | 3 0.003873 0.009744 -Get SCOTCH graph data | 1 0.000015 0.000015 -Gibbs-Poole-Stockmeyer ordering | 1 0.027943 0.027943 -Init MPI | 1 0.151486 0.151486 -Init PETSc | 1 0.072099 0.072099 -Init dofmap from element dofmap | 2 0.008741 0.017481 +Build BoxMesh | 1 25.057323 25.057323 +Build dofmap data | 2 0.341784 0.683568 +Build sparsity | 1 0.060808 0.060808 +Compute connectivity 2-3 | 1 0.012381 0.012381 +Compute dof reordering map | 2 0.007172 0.014344 +Compute entities of dim = 2 | 1 0.718176 0.718176 +Compute graph partition (SCOTCH) | 1 22.189431 22.189431 +Compute local part of mesh dual graph | 2 0.460482 0.920964 +Compute local-to-local map | 1 0.006121 0.006121 +Compute non-local part of mesh dual graph | 1 0.322069 0.322069 +Compute-local-to-global links for global/local adjacency list | 1 0.002982 0.002982 +Distribute AdjacencyList nodes to destination ranks | 1 0.521864 0.521864 +Distribute row-wise data (scalable) | 1 0.200576 0.200576 +Extract partition boundaries from SCOTCH graph | 1 0.003166 0.003166 +GPS: create_level_structure | 2 0.011068 0.029318 +Get SCOTCH graph data | 1 0.000016 0.000016 +Gibbs-Poole-Stockmeyer ordering | 1 0.074525 0.074525 +Init MPI | 1 0.544531 0.544531 +Init PETSc | 1 0.004181 0.004181 +Init dofmap from element dofmap | 2 0.025761 0.051522 Init logging | 1 0.000070 0.000070 -PETSc Krylov solver | 1 0.817945 0.817945 -SCOTCH: call SCOTCH_dgraphBuild | 1 0.004330 0.004330 -SCOTCH: call SCOTCH_dgraphHalo | 1 0.065735 0.065735 -SCOTCH: call SCOTCH_dgraphPart | 1 17.925561 17.925561 -SparsityPattern::assemble | 1 0.043044 0.043044 -Topology: create | 1 0.072891 0.072891 -Topology: determine shared index ownership | 1 0.005157 0.005157 -Topology: determine vertex ownership groups (owned, undetermined, unowned) | 1 0.011662 0.011662 -ZZZ Assemble | 1 0.323147 0.323147 -ZZZ Assemble matrix | 1 0.136474 0.136474 -ZZZ Assemble vector | 1 0.026269 0.026269 -ZZZ Create Mesh | 1 18.534732 18.534732 -ZZZ Create RHS function | 1 0.082233 0.082233 -ZZZ Create boundary conditions | 1 0.006505 0.006505 -ZZZ Create facets and facet->cell connectivity | 1 0.222114 0.222114 -ZZZ FunctionSpace | 1 0.014662 0.014662 -ZZZ Solve | 1 0.822405 0.822405 +PETSc Krylov solver | 1 7.670947 7.670947 +SCOTCH: call SCOTCH_dgraphBuild | 1 0.043894 0.043894 +SCOTCH: call SCOTCH_dgraphHalo | 1 0.119943 0.119943 +SCOTCH: call SCOTCH_dgraphPart | 1 22.071425 22.071425 +SparsityPattern::assemble | 1 0.123076 0.123076 +Topology: create | 1 0.890626 0.890626 +Topology: determine shared index ownership | 1 0.423716 0.423716 +Topology: determine vertex ownership groups (owned, undetermined, unowned) | 1 0.022819 0.022819 +ZZZ Assemble | 1 1.166310 1.166310 +ZZZ Assemble matrix | 1 0.271731 0.271731 +ZZZ Assemble vector | 1 0.058961 0.058961 +ZZZ Create Mesh | 1 25.057571 25.057571 +ZZZ Create RHS function | 1 0.471018 0.471018 +ZZZ Create boundary conditions | 1 0.146710 0.146710 +ZZZ Create facets and facet->cell connectivity | 1 0.730707 0.730707 +ZZZ FunctionSpace | 1 0.387144 0.387144 +ZZZ Solve | 1 7.710026 7.710026 *** Number of Krylov iterations: 7 *** Solution norm: 36.6791 **************************************************************************************************************************************************************** @@ -2901,16 +2944,16 @@ ------------------------------------------------------------------ PETSc Performance Summary: ------------------------------------------------------------------ -/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/dolfinx-scaling-test on a named virt64c with 3 processors, by pbuilder1 Mon May 15 13:41:47 2023 +/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/dolfinx-scaling-test on a named i-capture-the-hostname with 3 processors, by pbuilder2 Tue May 16 15:55:41 2023 Using Petsc Release Version 3.18.5, Feb 27, 2023 Max Max/Min Avg Total -Time (sec): 1.992e+01 1.001 1.991e+01 +Time (sec): 3.517e+01 1.000 3.517e+01 Objects: 3.200e+01 1.000 3.200e+01 -Flops: 3.508e+06 1.029 3.448e+06 1.035e+07 -Flops/sec: 1.762e+05 1.029 1.732e+05 5.195e+05 +Flops: 3.495e+06 1.026 3.449e+06 1.035e+07 +Flops/sec: 9.939e+04 1.026 9.808e+04 2.942e+05 MPI Msg Count: 2.800e+01 1.000 2.800e+01 8.400e+01 -MPI Msg Len (bytes): 1.965e+05 1.222 6.572e+03 5.521e+05 +MPI Msg Len (bytes): 1.967e+05 1.236 6.365e+03 5.347e+05 MPI Reductions: 6.700e+01 1.000 Flop counting convention: 1 flop = 1 real number operation of type (multiply/divide/add/subtract) @@ -2919,7 +2962,7 @@ Summary of Stages: ----- Time ------ ----- Flop ------ --- Messages --- -- Message Lengths -- -- Reductions -- Avg %Total Avg %Total Count %Total Avg %Total Count %Total - 0: Main Stage: 1.9914e+01 100.0% 1.0345e+07 100.0% 8.400e+01 100.0% 6.572e+03 100.0% 4.900e+01 73.1% + 0: Main Stage: 3.5169e+01 100.0% 1.0348e+07 100.0% 8.400e+01 100.0% 6.365e+03 100.0% 4.900e+01 73.1% ------------------------------------------------------------------------------------------------------------------------ See the 'Profiling' chapter of the users' manual for details on interpreting output. @@ -2943,30 +2986,30 @@ --- Event Stage 0: Main Stage -BuildTwoSided 4 1.0 7.8692e-03 5.2 0.00e+00 0.0 1.8e+01 4.0e+00 4.0e+00 0 0 21 0 6 0 0 21 0 8 0 -BuildTwoSidedF 2 1.0 7.8343e-03 57.8 0.00e+00 0.0 1.2e+01 2.3e+04 2.0e+00 0 0 14 49 3 0 0 14 49 4 0 -MatMult 7 1.0 8.6405e-03 1.0 1.94e+06 1.0 5.4e+01 4.8e+03 1.0e+00 0 55 64 47 1 0 55 64 47 2 663 -MatConvert 1 1.0 4.2298e-03 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 2.0e+00 0 0 0 0 3 0 0 0 0 4 0 -MatAssemblyBegin 3 1.0 1.1104e-02 2.7 0.00e+00 0.0 1.2e+01 2.3e+04 2.0e+00 0 0 14 49 3 0 0 14 49 4 0 -MatAssemblyEnd 3 1.0 8.1029e-03 1.1 3.89e+03 1.3 0.0e+00 0.0e+00 6.0e+00 0 0 0 0 9 0 0 0 0 12 1 -MatGetRowIJ 2 1.0 3.2600e-06 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatView 1 1.0 9.1796e-03 4.5 0.00e+00 0.0 0.0e+00 0.0e+00 1.0e+00 0 0 0 0 1 0 0 0 0 2 0 -VecTDot 14 1.0 7.2477e-04 1.2 2.82e+05 1.0 0.0e+00 0.0e+00 1.4e+01 0 8 0 0 21 0 8 0 0 29 1151 -VecNorm 8 1.0 3.8888e-03 10.2 1.61e+05 1.0 0.0e+00 0.0e+00 8.0e+00 0 5 0 0 12 0 5 0 0 16 123 -VecCopy 2 1.0 5.0435e-05 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecSet 9 1.0 1.5057e-04 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecAXPY 14 1.0 4.5050e-04 1.1 2.82e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 8 0 0 0 0 8 0 0 0 1852 -VecAYPX 6 1.0 2.3726e-04 1.3 1.21e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 3 0 0 0 0 3 0 0 0 1507 -VecScatterBegin 8 1.0 2.1072e-03 2.2 0.00e+00 0.0 7.2e+01 3.9e+03 2.0e+00 0 0 86 51 3 0 0 86 51 4 0 -VecScatterEnd 8 1.0 1.0624e-03 1.9 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFSetGraph 3 1.0 9.6531e-05 1.3 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFSetUp 2 1.0 1.6852e-03 4.4 0.00e+00 0.0 2.4e+01 1.0e+03 2.0e+00 0 0 29 4 3 0 0 29 4 4 0 -SFPack 8 1.0 1.9744e-04 1.3 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFUnpack 8 1.0 1.7378e-05 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -KSPSetUp 1 1.0 1.5646e-04 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -KSPSolve 1 1.0 4.0275e-01 1.0 2.79e+06 1.0 5.4e+01 4.8e+03 2.3e+01 2 80 64 47 34 2 80 64 47 47 20 -PCSetUp 1 1.0 4.0425e-01 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 2.0e+00 2 0 0 0 3 2 0 0 0 4 0 -PCApply 8 1.0 3.9206e-01 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 2 0 0 0 0 2 0 0 0 0 0 +BuildTwoSided 4 1.0 6.9187e-02 2.4 0.00e+00 0.0 1.8e+01 4.0e+00 4.0e+00 0 0 21 0 6 0 0 21 0 8 0 +BuildTwoSidedF 2 1.0 3.3677e-02 6.5 0.00e+00 0.0 1.2e+01 2.2e+04 2.0e+00 0 0 14 49 3 0 0 14 49 4 0 +MatMult 7 1.0 1.6055e-01 1.3 1.94e+06 1.0 5.4e+01 4.7e+03 1.0e+00 0 55 64 48 1 0 55 64 48 2 36 +MatConvert 1 1.0 1.0314e-01 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 2.0e+00 0 0 0 0 3 0 0 0 0 4 0 +MatAssemblyBegin 3 1.0 3.7421e-02 2.9 0.00e+00 0.0 1.2e+01 2.2e+04 2.0e+00 0 0 14 49 3 0 0 14 49 4 0 +MatAssemblyEnd 3 1.0 9.9342e-02 1.1 3.96e+03 1.3 0.0e+00 0.0e+00 6.0e+00 0 0 0 0 9 0 0 0 0 12 0 +MatGetRowIJ 2 1.0 3.9000e-06 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatView 1 1.0 1.1971e-02 1.9 0.00e+00 0.0 0.0e+00 0.0e+00 1.0e+00 0 0 0 0 1 0 0 0 0 2 0 +VecTDot 14 1.0 1.4424e-01 1.6 2.81e+05 1.0 0.0e+00 0.0e+00 1.4e+01 0 8 0 0 21 0 8 0 0 29 6 +VecNorm 8 1.0 9.0722e-02 2.9 1.61e+05 1.0 0.0e+00 0.0e+00 8.0e+00 0 5 0 0 12 0 5 0 0 16 5 +VecCopy 2 1.0 6.2295e-05 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecSet 9 1.0 1.5268e-04 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecAXPY 14 1.0 5.1325e-04 1.2 2.81e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 8 0 0 0 0 8 0 0 0 1625 +VecAYPX 6 1.0 2.8223e-04 1.3 1.21e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 3 0 0 0 0 3 0 0 0 1267 +VecScatterBegin 8 1.0 6.7971e-02 1.4 0.00e+00 0.0 7.2e+01 3.8e+03 2.0e+00 0 0 86 51 3 0 0 86 51 4 0 +VecScatterEnd 8 1.0 1.2623e-01 1.4 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFSetGraph 3 1.0 8.5412e-05 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFSetUp 2 1.0 6.7547e-02 1.4 0.00e+00 0.0 2.4e+01 9.7e+02 2.0e+00 0 0 29 4 3 0 0 29 4 4 0 +SFPack 8 1.0 1.4723e-04 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFUnpack 8 1.0 5.4934e-05 1.4 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +KSPSetUp 1 1.0 1.1873e-04 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +KSPSolve 1 1.0 3.3138e+00 1.0 2.78e+06 1.0 5.4e+01 4.7e+03 2.3e+01 9 80 64 48 34 9 80 64 48 47 2 +PCSetUp 1 1.0 4.3090e+00 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 2.0e+00 12 0 0 0 3 12 0 0 0 4 0 +PCApply 8 1.0 3.0262e+00 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 9 0 0 0 0 9 0 0 0 0 0 --- Event Stage 1: Unknown @@ -2988,9 +3031,9 @@ --- Event Stage 1: Unknown ======================================================================================================================== -Average time to get PetscTime(): 1.379e-07 -Average time for MPI_Barrier(): 3.4838e-06 -Average time for zero size MPI_Send(): 5.47933e-06 +Average time to get PetscTime(): 1.44e-07 +Average time for MPI_Barrier(): 3.6956e-06 +Average time for zero size MPI_Send(): 6.006e-06 #PETSc Option Table entries: --ndofs 10000 --problem_type poisson @@ -3046,67 +3089,67 @@ Option left: name:--ndofs value: 10000 Option left: name:--problem_type value: poisson Option left: name:--scaling_type value: weak -2023-05-15 13:41:47.750 ( 20.178s) [RANK: 0 ] loguru.cpp:526 INFO| atexit +2023-05-16 15:55:43.171 ( 37.241s) [RANK: 0 ] loguru.cpp:526 INFO| atexit ==== poisson strong scaling (3 processes with ndofs=30000) ==== -2023-05-15 13:41:48.059 ( 0.138s) [RANK: 0 ] utils.cpp:612 INFO| Compute partition of cells across ranks -2023-05-15 13:41:48.060 ( 0.138s) [RANK: 0 ] graphbuild.cpp:533 INFO| Building mesh dual graph -2023-05-15 13:41:48.060 ( 0.138s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph -2023-05-15 13:41:48.231 ( 0.310s) [RANK: 0 ] graphbuild.cpp:89 INFO| Build nonlocal part of mesh dual graph -2023-05-15 13:41:48.232 ( 0.310s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:41:48.232 ( 0.311s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:41:48.233 ( 0.311s) [RANK: 0 ] graphbuild.cpp:203 INFO| Number of destination and source ranks in non-local dual graph construction, and ratio to total number of ranks: 2, 2, 0.666667, 0.666667 -2023-05-15 13:41:48.241 ( 0.319s) [RANK: 0 ] graphbuild.cpp:545 INFO| Graph edges (local: 210000, non-local: 1800) -2023-05-15 13:41:48.241 ( 0.319s) [RANK: 0 ] partitioners.cpp:316 INFO| Compute graph partition using PT-SCOTCH -2023-05-15 13:42:05.277 ( 17.355s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 -2023-05-15 13:42:05.277 ( 17.355s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 -2023-05-15 13:42:05.289 ( 17.368s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph -2023-05-15 13:42:05.456 ( 17.534s) [RANK: 0 ] ordering.cpp:202 INFO| GPS pseudo-diameter:(167) 51493-1755 - -2023-05-15 13:42:05.482 ( 17.560s) [RANK: 0 ] Topology.cpp:923 INFO| Create topology -2023-05-15 13:42:05.513 ( 17.591s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 -2023-05-15 13:42:05.513 ( 17.591s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 -2023-05-15 13:42:05.569 ( 17.647s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.573 ( 17.651s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.573 ( 17.651s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.573 ( 17.651s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.583 ( 17.661s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.584 ( 17.663s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.585 ( 17.663s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:42:05.585 ( 17.663s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:42:05.586 ( 17.664s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.586 ( 17.664s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.599 ( 17.677s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:42:05.599 ( 17.677s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:42:05.599 ( 17.677s) [RANK: 0 ] MPI.h:368 INFO| Number of neighbourhood source ranks in distribute_to_postoffice: 0 -2023-05-15 13:42:05.600 ( 17.679s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.601 ( 17.679s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.601 ( 17.679s) [RANK: 0 ] MPI.h:500 INFO| Neighbourhood destination ranks from post office in distribute_data (rank, num dests, num dests/mpi_size): 0, 2, 0.666667 +2023-05-16 15:55:44.648 ( 0.547s) [RANK: 0 ] utils.cpp:612 INFO| Compute partition of cells across ranks +2023-05-16 15:55:44.648 ( 0.547s) [RANK: 0 ] graphbuild.cpp:533 INFO| Building mesh dual graph +2023-05-16 15:55:44.648 ( 0.547s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph +2023-05-16 15:55:45.032 ( 0.931s) [RANK: 0 ] graphbuild.cpp:89 INFO| Build nonlocal part of mesh dual graph +2023-05-16 15:55:45.065 ( 0.963s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:55:45.069 ( 0.967s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:55:45.069 ( 0.967s) [RANK: 0 ] graphbuild.cpp:203 INFO| Number of destination and source ranks in non-local dual graph construction, and ratio to total number of ranks: 2, 2, 0.666667, 0.666667 +2023-05-16 15:55:45.150 ( 1.049s) [RANK: 0 ] graphbuild.cpp:545 INFO| Graph edges (local: 210000, non-local: 1800) +2023-05-16 15:55:45.150 ( 1.049s) [RANK: 0 ] partitioners.cpp:316 INFO| Compute graph partition using PT-SCOTCH +2023-05-16 15:56:06.542 ( 22.440s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 +2023-05-16 15:56:06.564 ( 22.463s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 +2023-05-16 15:56:07.012 ( 22.911s) [RANK: 0 ] graphbuild.cpp:396 INFO| Build local part of mesh dual graph +2023-05-16 15:56:07.447 ( 23.345s) [RANK: 0 ] ordering.cpp:202 INFO| GPS pseudo-diameter:(169) 50547-237 + +2023-05-16 15:56:07.496 ( 23.394s) [RANK: 0 ] Topology.cpp:923 INFO| Create topology +2023-05-16 15:56:07.617 ( 23.515s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 3 +2023-05-16 15:56:07.617 ( 23.515s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 3 +2023-05-16 15:56:07.732 ( 23.631s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:07.775 ( 23.674s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:07.786 ( 23.684s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:07.786 ( 23.684s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:07.800 ( 23.699s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:07.824 ( 23.723s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:07.842 ( 23.740s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:56:07.852 ( 23.751s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:56:07.857 ( 23.756s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:07.858 ( 23.756s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:07.894 ( 23.793s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:56:07.895 ( 23.793s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:56:07.895 ( 23.793s) [RANK: 0 ] MPI.h:368 INFO| Number of neighbourhood source ranks in distribute_to_postoffice: 0 +2023-05-16 15:56:07.895 ( 23.794s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:07.896 ( 23.794s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:07.896 ( 23.794s) [RANK: 0 ] MPI.h:500 INFO| Neighbourhood destination ranks from post office in distribute_data (rank, num dests, num dests/mpi_size): 0, 2, 0.666667 UnitCube (30x30x30) to be refined 0 times -2023-05-15 13:42:05.610 ( 17.688s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 2 -2023-05-15 13:42:05.671 ( 17.749s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.672 ( 17.751s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.820 ( 17.898s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.820 ( 17.898s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.828 ( 17.906s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:42:05.828 ( 17.906s) [RANK: 0 ]topologycomputation.cpp:650 INFO| Computing mesh connectivity 2 - 3 from transpose. -2023-05-15 13:42:05.833 ( 17.911s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 0 -2023-05-15 13:42:05.846 ( 17.924s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.846 ( 17.924s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.846 ( 17.924s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.846 ( 17.924s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.847 ( 17.925s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 -2023-05-15 13:42:05.847 ( 17.925s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 -2023-05-15 13:42:05.847 ( 17.926s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.848 ( 17.926s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:05.850 ( 17.928s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 -2023-05-15 13:42:05.853 ( 17.931s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 -2023-05-15 13:42:05.853 ( 17.931s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 0 -2023-05-15 13:42:05.854 ( 17.932s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:42:05.948 ( 18.027s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 -2023-05-15 13:42:05.949 ( 18.027s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 2 -2023-05-15 13:42:05.949 ( 18.027s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 -2023-05-15 13:42:05.949 ( 18.028s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 -2023-05-15 13:42:06.015 ( 18.094s) [RANK: 0 ] SparsityPattern.cpp:389 INFO| Column ghost size increased from 464 to 1256 +2023-05-16 15:56:07.954 ( 23.852s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 2 +2023-05-16 15:56:08.015 ( 23.913s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:08.123 ( 24.022s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:08.525 ( 24.423s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:08.536 ( 24.434s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:08.551 ( 24.450s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:56:08.551 ( 24.450s) [RANK: 0 ]topologycomputation.cpp:650 INFO| Computing mesh connectivity 2 - 3 from transpose. +2023-05-16 15:56:08.565 ( 24.464s) [RANK: 0 ]topologycomputation.cpp:746 INFO| Computing mesh entities of dimension 0 +2023-05-16 15:56:08.584 ( 24.482s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:08.607 ( 24.506s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:08.608 ( 24.506s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:08.608 ( 24.506s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:08.608 ( 24.507s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 0 +2023-05-16 15:56:08.608 ( 24.507s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 0 +2023-05-16 15:56:08.617 ( 24.516s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:08.617 ( 24.516s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:08.620 ( 24.518s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 +2023-05-16 15:56:08.625 ( 24.523s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 0 +2023-05-16 15:56:08.625 ( 24.523s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 0 +2023-05-16 15:56:08.626 ( 24.525s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:56:08.971 ( 24.869s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 2 - 3 +2023-05-16 15:56:08.971 ( 24.870s) [RANK: 0 ]topologycomputation.cpp:786 INFO| Requesting connectivity 3 - 2 +2023-05-16 15:56:08.971 ( 24.870s) [RANK: 0 ] MPI.cpp:154 INFO| Computing communicaton graph edges (using NBX algorithm). Number of input edges: 2 +2023-05-16 15:56:09.008 ( 24.907s) [RANK: 0 ] MPI.cpp:217 INFO| Finished graph edge discovery using NBX algorithm. Number of discovered edges 2 +2023-05-16 15:56:09.252 ( 25.151s) [RANK: 0 ] SparsityPattern.cpp:389 INFO| Column ghost size increased from 475 to 1242 ---------------------------------------------------------------- Test problem summary @@ -3121,7 +3164,7 @@ Total degrees of freedom: 29791 (29.8 thousand) Average degrees of freedom per process: 9930 ---------------------------------------------------------------- -2023-05-15 13:42:06.196 ( 18.274s) [RANK: 0 ] petsc.cpp:677 INFO| PETSc Krylov solver starting to solve system. +2023-05-16 15:56:09.939 ( 25.837s) [RANK: 0 ] petsc.cpp:677 INFO| PETSc Krylov solver starting to solve system. KSP Object: 3 MPI processes type: cg maximum iterations=10000, initial guess is zero @@ -3165,44 +3208,44 @@ [MPI_MAX] Summary of timings | reps wall avg wall tot --------------------------------------------------------------------------------------------------------- -Build BoxMesh | 1 17.557787 17.557787 -Build dofmap data | 2 0.015147 0.030295 -Build sparsity | 1 0.026714 0.026714 -Compute connectivity 2-3 | 1 0.004961 0.004961 -Compute dof reordering map | 2 0.001344 0.002688 -Compute entities of dim = 2 | 1 0.219207 0.219207 -Compute graph partition (SCOTCH) | 1 17.025626 17.025626 -Compute local part of mesh dual graph | 2 0.166949 0.333897 -Compute local-to-local map | 1 0.002453 0.002453 -Compute non-local part of mesh dual graph | 1 0.015614 0.015614 -Compute-local-to-global links for global/local adjacency list | 1 0.003168 0.003168 -Distribute AdjacencyList nodes to destination ranks | 1 0.023581 0.023581 -Distribute row-wise data (scalable) | 1 0.004457 0.004457 -Extract partition boundaries from SCOTCH graph | 1 0.003284 0.003284 -GPS: create_level_structure | 2 0.003624 0.014498 -Get SCOTCH graph data | 1 0.000013 0.000013 -Gibbs-Poole-Stockmeyer ordering | 1 0.035050 0.035050 -Init MPI | 1 0.125719 0.125719 -Init PETSc | 1 0.007221 0.007221 -Init dofmap from element dofmap | 2 0.009488 0.018977 +Build BoxMesh | 1 23.333466 23.333466 +Build dofmap data | 2 0.063489 0.126979 +Build sparsity | 1 0.095001 0.095001 +Compute connectivity 2-3 | 1 0.012993 0.012993 +Compute dof reordering map | 2 0.001182 0.002363 +Compute entities of dim = 2 | 1 0.606327 0.606327 +Compute graph partition (SCOTCH) | 1 21.346761 21.346761 +Compute local part of mesh dual graph | 2 0.442666 0.885332 +Compute local-to-local map | 1 0.002316 0.002316 +Compute non-local part of mesh dual graph | 1 0.154616 0.154616 +Compute-local-to-global links for global/local adjacency list | 1 0.010883 0.010883 +Distribute AdjacencyList nodes to destination ranks | 1 0.533848 0.533848 +Distribute row-wise data (scalable) | 1 0.024517 0.024517 +Extract partition boundaries from SCOTCH graph | 1 0.003075 0.003075 +GPS: create_level_structure | 6 0.010642 0.060264 +Get SCOTCH graph data | 1 0.000020 0.000020 +Gibbs-Poole-Stockmeyer ordering | 1 0.101799 0.101799 +Init MPI | 1 0.635408 0.635408 +Init PETSc | 1 0.005180 0.005180 +Init dofmap from element dofmap | 2 0.024670 0.049340 Init logging | 1 0.000071 0.000071 -PETSc Krylov solver | 1 0.820146 0.820146 -SCOTCH: call SCOTCH_dgraphBuild | 1 0.000595 0.000595 -SCOTCH: call SCOTCH_dgraphHalo | 1 0.073866 0.073866 -SCOTCH: call SCOTCH_dgraphPart | 1 17.011886 17.011886 -SparsityPattern::assemble | 1 0.041694 0.041694 -Topology: create | 1 0.091402 0.091402 -Topology: determine shared index ownership | 1 0.020791 0.020791 -Topology: determine vertex ownership groups (owned, undetermined, unowned) | 1 0.011544 0.011544 -ZZZ Assemble | 1 0.341343 0.341343 -ZZZ Assemble matrix | 1 0.138731 0.138731 -ZZZ Assemble vector | 1 0.027932 0.027932 -ZZZ Create Mesh | 1 17.558176 17.558176 -ZZZ Create RHS function | 1 0.091795 0.091795 -ZZZ Create boundary conditions | 1 0.006870 0.006870 -ZZZ Create facets and facet->cell connectivity | 1 0.224320 0.224320 -ZZZ FunctionSpace | 1 0.016880 0.016880 -ZZZ Solve | 1 0.825175 0.825175 +PETSc Krylov solver | 1 11.509998 11.509998 +SCOTCH: call SCOTCH_dgraphBuild | 1 0.025632 0.025632 +SCOTCH: call SCOTCH_dgraphHalo | 1 0.135932 0.135932 +SCOTCH: call SCOTCH_dgraphPart | 1 21.241642 21.241642 +SparsityPattern::assemble | 1 0.144886 0.144886 +Topology: create | 1 0.290471 0.290471 +Topology: determine shared index ownership | 1 0.110813 0.110813 +Topology: determine vertex ownership groups (owned, undetermined, unowned) | 1 0.034830 0.034830 +ZZZ Assemble | 1 1.209170 1.209170 +ZZZ Assemble matrix | 1 0.447289 0.447289 +ZZZ Assemble vector | 1 0.082770 0.082770 +ZZZ Create Mesh | 1 23.333710 23.333710 +ZZZ Create RHS function | 1 0.292267 0.292267 +ZZZ Create boundary conditions | 1 0.081534 0.081534 +ZZZ Create facets and facet->cell connectivity | 1 0.619253 0.619253 +ZZZ FunctionSpace | 1 0.059212 0.059212 +ZZZ Solve | 1 11.559961 11.559961 *** Number of Krylov iterations: 7 *** Solution norm: 36.6791 **************************************************************************************************************************************************************** @@ -3211,16 +3254,16 @@ ------------------------------------------------------------------ PETSc Performance Summary: ------------------------------------------------------------------ -/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/dolfinx-scaling-test on a named virt64c with 3 processors, by pbuilder1 Mon May 15 13:42:07 2023 +/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf/dolfinx-scaling-test on a named i-capture-the-hostname with 3 processors, by pbuilder2 Tue May 16 15:56:21 2023 Using Petsc Release Version 3.18.5, Feb 27, 2023 Max Max/Min Avg Total -Time (sec): 1.897e+01 1.000 1.897e+01 +Time (sec): 3.689e+01 1.000 3.688e+01 Objects: 3.200e+01 1.000 3.200e+01 -Flops: 3.490e+06 1.024 3.449e+06 1.035e+07 -Flops/sec: 1.840e+05 1.024 1.818e+05 5.455e+05 +Flops: 3.504e+06 1.027 3.449e+06 1.035e+07 +Flops/sec: 9.498e+04 1.027 9.351e+04 2.805e+05 MPI Msg Count: 2.800e+01 1.000 2.800e+01 8.400e+01 -MPI Msg Len (bytes): 1.888e+05 1.199 6.345e+03 5.330e+05 +MPI Msg Len (bytes): 2.081e+05 1.320 6.367e+03 5.348e+05 MPI Reductions: 6.700e+01 1.000 Flop counting convention: 1 flop = 1 real number operation of type (multiply/divide/add/subtract) @@ -3229,7 +3272,7 @@ Summary of Stages: ----- Time ------ ----- Flop ------ --- Messages --- -- Message Lengths -- -- Reductions -- Avg %Total Avg %Total Count %Total Avg %Total Count %Total - 0: Main Stage: 1.8969e+01 100.0% 1.0348e+07 100.0% 8.400e+01 100.0% 6.345e+03 100.0% 4.900e+01 73.1% + 0: Main Stage: 3.6885e+01 100.0% 1.0348e+07 100.0% 8.400e+01 100.0% 6.367e+03 100.0% 4.900e+01 73.1% ------------------------------------------------------------------------------------------------------------------------ See the 'Profiling' chapter of the users' manual for details on interpreting output. @@ -3253,30 +3296,30 @@ --- Event Stage 0: Main Stage -BuildTwoSided 4 1.0 1.0484e-02 9.6 0.00e+00 0.0 1.8e+01 4.0e+00 4.0e+00 0 0 21 0 6 0 0 21 0 8 0 -BuildTwoSidedF 2 1.0 9.7877e-03 9.1 0.00e+00 0.0 1.2e+01 2.2e+04 2.0e+00 0 0 14 49 3 0 0 14 49 4 0 -MatMult 7 1.0 8.4143e-03 1.0 1.93e+06 1.0 5.4e+01 4.7e+03 1.0e+00 0 55 64 47 1 0 55 64 47 2 681 -MatConvert 1 1.0 4.4323e-03 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 2.0e+00 0 0 0 0 3 0 0 0 0 4 0 -MatAssemblyBegin 3 1.0 1.3356e-02 2.8 0.00e+00 0.0 1.2e+01 2.2e+04 2.0e+00 0 0 14 49 3 0 0 14 49 4 0 -MatAssemblyEnd 3 1.0 8.1487e-03 1.1 3.82e+03 1.3 0.0e+00 0.0e+00 6.0e+00 0 0 0 0 9 0 0 0 0 12 1 -MatGetRowIJ 2 1.0 3.7600e-06 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -MatView 1 1.0 1.3297e-03 8.5 0.00e+00 0.0 0.0e+00 0.0e+00 1.0e+00 0 0 0 0 1 0 0 0 0 2 0 -VecTDot 14 1.0 9.1927e-04 1.3 2.81e+05 1.0 0.0e+00 0.0e+00 1.4e+01 0 8 0 0 21 0 8 0 0 29 907 -VecNorm 8 1.0 1.3386e-03 3.3 1.60e+05 1.0 0.0e+00 0.0e+00 8.0e+00 0 5 0 0 12 0 5 0 0 16 356 -VecCopy 2 1.0 5.4275e-05 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecSet 9 1.0 1.9690e-04 1.4 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -VecAXPY 14 1.0 5.8809e-04 1.2 2.81e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 8 0 0 0 0 8 0 0 0 1418 -VecAYPX 6 1.0 2.5224e-04 1.3 1.20e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 3 0 0 0 0 3 0 0 0 1417 -VecScatterBegin 8 1.0 1.3514e-03 2.1 0.00e+00 0.0 7.2e+01 3.8e+03 2.0e+00 0 0 86 51 3 0 0 86 51 4 0 -VecScatterEnd 8 1.0 1.0153e-03 2.5 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFSetGraph 3 1.0 8.3592e-05 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFSetUp 2 1.0 1.0090e-03 3.1 0.00e+00 0.0 2.4e+01 9.6e+02 2.0e+00 0 0 29 4 3 0 0 29 4 4 0 -SFPack 8 1.0 1.1407e-04 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -SFUnpack 8 1.0 2.1178e-05 1.5 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -KSPSetUp 1 1.0 1.3029e-04 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 -KSPSolve 1 1.0 4.0281e-01 1.0 2.78e+06 1.0 5.4e+01 4.7e+03 2.3e+01 2 80 64 47 34 2 80 64 47 47 20 -PCSetUp 1 1.0 4.1561e-01 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 2.0e+00 2 0 0 0 3 2 0 0 0 4 0 -PCApply 8 1.0 3.9212e-01 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 2 0 0 0 0 2 0 0 0 0 0 +BuildTwoSided 4 1.0 1.1800e-01 2.1 0.00e+00 0.0 1.8e+01 4.0e+00 4.0e+00 0 0 21 0 6 0 0 21 0 8 0 +BuildTwoSidedF 2 1.0 8.8418e-02 9.0 0.00e+00 0.0 1.2e+01 2.2e+04 2.0e+00 0 0 14 49 3 0 0 14 49 4 0 +MatMult 7 1.0 2.0585e-01 1.2 1.94e+06 1.0 5.4e+01 4.7e+03 1.0e+00 1 55 64 47 1 1 55 64 47 2 28 +MatConvert 1 1.0 7.1345e-02 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 2.0e+00 0 0 0 0 3 0 0 0 0 4 0 +MatAssemblyBegin 3 1.0 9.1874e-02 4.3 0.00e+00 0.0 1.2e+01 2.2e+04 2.0e+00 0 0 14 49 3 0 0 14 49 4 0 +MatAssemblyEnd 3 1.0 1.0951e-01 1.1 4.11e+03 1.4 0.0e+00 0.0e+00 6.0e+00 0 0 0 0 9 0 0 0 0 12 0 +MatGetRowIJ 2 1.0 4.1400e-06 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +MatView 1 1.0 2.7932e-02 2.0 0.00e+00 0.0 0.0e+00 0.0e+00 1.0e+00 0 0 0 0 1 0 0 0 0 2 0 +VecTDot 14 1.0 1.7006e-01 1.5 2.82e+05 1.0 0.0e+00 0.0e+00 1.4e+01 0 8 0 0 21 0 8 0 0 29 5 +VecNorm 8 1.0 1.1291e-01 3.0 1.61e+05 1.0 0.0e+00 0.0e+00 8.0e+00 0 5 0 0 12 0 5 0 0 16 4 +VecCopy 2 1.0 6.2294e-05 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecSet 9 1.0 1.6077e-04 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +VecAXPY 14 1.0 6.1260e-04 1.1 2.82e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 8 0 0 0 0 8 0 0 0 1362 +VecAYPX 6 1.0 2.7591e-04 1.1 1.21e+05 1.0 0.0e+00 0.0e+00 0.0e+00 0 3 0 0 0 0 3 0 0 0 1296 +VecScatterBegin 8 1.0 7.2412e-02 1.3 0.00e+00 0.0 7.2e+01 3.8e+03 2.0e+00 0 0 86 51 3 0 0 86 51 4 0 +VecScatterEnd 8 1.0 1.7459e-01 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFSetGraph 3 1.0 9.7291e-05 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFSetUp 2 1.0 7.1926e-02 1.3 0.00e+00 0.0 2.4e+01 9.7e+02 2.0e+00 0 0 29 4 3 0 0 29 4 4 0 +SFPack 8 1.0 1.7692e-04 1.2 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +SFUnpack 8 1.0 5.3896e-05 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +KSPSetUp 1 1.0 1.3579e-04 1.1 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 0 0 0 0 0 0 0 0 0 0 0 +KSPSolve 1 1.0 7.5959e+00 1.0 2.79e+06 1.0 5.4e+01 4.7e+03 2.3e+01 21 80 64 47 34 21 80 64 47 47 1 +PCSetUp 1 1.0 3.8538e+00 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 2.0e+00 10 0 0 0 3 10 0 0 0 4 0 +PCApply 8 1.0 7.2200e+00 1.0 0.00e+00 0.0 0.0e+00 0.0e+00 0.0e+00 19 0 0 0 0 19 0 0 0 0 0 --- Event Stage 1: Unknown @@ -3298,9 +3341,9 @@ --- Event Stage 1: Unknown ======================================================================================================================== -Average time to get PetscTime(): 1.4e-07 -Average time for MPI_Barrier(): 4.9554e-06 -Average time for zero size MPI_Send(): 6.886e-06 +Average time to get PetscTime(): 1.759e-07 +Average time for MPI_Barrier(): 5.9554e-06 +Average time for zero size MPI_Send(): 7.69933e-06 #PETSc Option Table entries: --ndofs 30000 --problem_type poisson @@ -3356,13 +3399,13 @@ Option left: name:--ndofs value: 30000 Option left: name:--problem_type value: poisson Option left: name:--scaling_type value: strong -2023-05-15 13:42:07.098 ( 19.176s) [RANK: 0 ] loguru.cpp:526 INFO| atexit +2023-05-16 15:56:22.083 ( 37.981s) [RANK: 0 ] loguru.cpp:526 INFO| atexit make[1]: Leaving directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b' create-stamp debian/debhelper-build-stamp dh_testroot -O--buildsystem=cmake -O--sourcedirectory=src dh_prep -O--buildsystem=cmake -O--sourcedirectory=src dh_auto_install -O--buildsystem=cmake -O--sourcedirectory=src - cd obj-arm-linux-gnueabihf && make -j3 install DESTDIR=/build/fenicsx-performance-tests-0.5.0\~git20220731.821823b/debian/tmp AM_UPDATE_INFO_DIR=no "INSTALL=install --strip-program=true" + cd obj-arm-linux-gnueabihf && make -j4 install DESTDIR=/build/fenicsx-performance-tests-0.5.0\~git20220731.821823b/debian/tmp AM_UPDATE_INFO_DIR=no "INSTALL=install --strip-program=true" make[1]: Entering directory '/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf' /usr/bin/cmake -S"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/src" -B"/build/fenicsx-performance-tests-0.5.0~git20220731.821823b/obj-arm-linux-gnueabihf" --check-build-system CMakeFiles/Makefile.cmake 0 make -f CMakeFiles/Makefile2 preinstall @@ -3395,8 +3438,8 @@ dh_md5sums -O--buildsystem=cmake -O--sourcedirectory=src dh_builddeb -O--buildsystem=cmake -O--sourcedirectory=src dpkg-deb: building package 'fenicsx-performance-tests-dbgsym' in '../fenicsx-performance-tests-dbgsym_0.5.0~git20220731.821823b-1_armhf.deb'. -dpkg-deb: building package 'fenicsx-performance-tests' in '../fenicsx-performance-tests_0.5.0~git20220731.821823b-1_armhf.deb'. dpkg-deb: building package 'fenicsx-performance-tests-source' in '../fenicsx-performance-tests-source_0.5.0~git20220731.821823b-1_all.deb'. +dpkg-deb: building package 'fenicsx-performance-tests' in '../fenicsx-performance-tests_0.5.0~git20220731.821823b-1_armhf.deb'. dpkg-genbuildinfo --build=binary -O../fenicsx-performance-tests_0.5.0~git20220731.821823b-1_armhf.buildinfo dpkg-genchanges --build=binary -O../fenicsx-performance-tests_0.5.0~git20220731.821823b-1_armhf.changes dpkg-genchanges: info: binary-only upload (no source code included) @@ -3404,12 +3447,14 @@ dpkg-buildpackage: info: binary-only upload (no source included) dpkg-genchanges: info: including full source code in upload I: copying local configuration +I: user script /srv/workspace/pbuilder/27026/tmp/hooks/B01_cleanup starting +I: user script /srv/workspace/pbuilder/27026/tmp/hooks/B01_cleanup finished I: unmounting dev/ptmx filesystem I: unmounting dev/pts filesystem I: unmounting dev/shm filesystem I: unmounting proc filesystem I: unmounting sys filesystem I: cleaning the build env -I: removing directory /srv/workspace/pbuilder/1361 and its subdirectories -I: Current time: Mon May 15 13:42:33 -12 2023 -I: pbuilder-time-stamp: 1684201353 +I: removing directory /srv/workspace/pbuilder/27026 and its subdirectories +I: Current time: Tue May 16 15:57:35 +14 2023 +I: pbuilder-time-stamp: 1684202255