Diff of the two buildlogs: -- --- b1/build.log 2024-12-02 18:20:00.918801559 +0000 +++ b2/build.log 2024-12-02 19:13:54.492526388 +0000 @@ -1,6 +1,6 @@ I: pbuilder: network access will be disabled during build -I: Current time: Sun Jan 4 12:33:31 -12 2026 -I: pbuilder-time-stamp: 1767573211 +I: Current time: Tue Dec 3 08:20:04 +14 2024 +I: pbuilder-time-stamp: 1733163604 I: Building the build Environment I: extracting base tarball [/var/cache/pbuilder/unstable-reproducible-base.tgz] I: copying local configuration @@ -30,53 +30,85 @@ dpkg-source: info: applying auto-gitignore I: Not using root during the build. I: Installing the build-deps -I: user script /srv/workspace/pbuilder/23139/tmp/hooks/D02_print_environment starting +I: user script /srv/workspace/pbuilder/13949/tmp/hooks/D01_modify_environment starting +debug: Running on infom07-i386. +I: Changing host+domainname to test build reproducibility +I: Adding a custom variable just for the fun of it... +I: Changing /bin/sh to bash +'/bin/sh' -> '/bin/bash' +lrwxrwxrwx 1 root root 9 Dec 2 18:20 /bin/sh -> /bin/bash +I: Setting pbuilder2's login shell to /bin/bash +I: Setting pbuilder2's GECOS to second user,second room,second work-phone,second home-phone,second other +I: user script /srv/workspace/pbuilder/13949/tmp/hooks/D01_modify_environment finished +I: user script /srv/workspace/pbuilder/13949/tmp/hooks/D02_print_environment starting I: set - BUILDDIR='/build/reproducible-path' - BUILDUSERGECOS='first user,first room,first work-phone,first home-phone,first other' - BUILDUSERNAME='pbuilder1' - BUILD_ARCH='i386' - DEBIAN_FRONTEND='noninteractive' - DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=6 ' - DISTRIBUTION='unstable' - HOME='/root' - HOST_ARCH='i386' + BASH=/bin/sh + BASHOPTS=checkwinsize:cmdhist:complete_fullquote:extquote:force_fignore:globasciiranges:globskipdots:hostcomplete:interactive_comments:patsub_replacement:progcomp:promptvars:sourcepath + BASH_ALIASES=() + BASH_ARGC=() + BASH_ARGV=() + BASH_CMDS=() + BASH_LINENO=([0]="12" [1]="0") + BASH_LOADABLES_PATH=/usr/local/lib/bash:/usr/lib/bash:/opt/local/lib/bash:/usr/pkg/lib/bash:/opt/pkg/lib/bash:. + BASH_SOURCE=([0]="/tmp/hooks/D02_print_environment" [1]="/tmp/hooks/D02_print_environment") + BASH_VERSINFO=([0]="5" [1]="2" [2]="32" [3]="1" [4]="release" [5]="i686-pc-linux-gnu") + BASH_VERSION='5.2.32(1)-release' + BUILDDIR=/build/reproducible-path + BUILDUSERGECOS='second user,second room,second work-phone,second home-phone,second other' + BUILDUSERNAME=pbuilder2 + BUILD_ARCH=i386 + DEBIAN_FRONTEND=noninteractive + DEB_BUILD_OPTIONS='buildinfo=+all reproducible=+all parallel=5 ' + DIRSTACK=() + DISTRIBUTION=unstable + EUID=0 + FUNCNAME=([0]="Echo" [1]="main") + GROUPS=() + HOME=/root + HOSTNAME=i-capture-the-hostname + HOSTTYPE=i686 + HOST_ARCH=i386 IFS=' ' - INVOCATION_ID='b0a4aaaee1eb481b8662f16ba0e87027' - LANG='C' - LANGUAGE='en_US:en' - LC_ALL='C' - LD_LIBRARY_PATH='/usr/lib/libeatmydata' - LD_PRELOAD='libeatmydata.so' - MAIL='/var/mail/root' - OPTIND='1' - PATH='/usr/sbin:/usr/bin:/sbin:/bin:/usr/games' - PBCURRENTCOMMANDLINEOPERATION='build' - PBUILDER_OPERATION='build' - PBUILDER_PKGDATADIR='/usr/share/pbuilder' - PBUILDER_PKGLIBDIR='/usr/lib/pbuilder' - PBUILDER_SYSCONFDIR='/etc' - PPID='23139' - PS1='# ' - PS2='> ' + INVOCATION_ID=196b00f749c3461694cb8ed9b2ebd04f + LANG=C + LANGUAGE=de_CH:de + LC_ALL=C + LD_LIBRARY_PATH=/usr/lib/libeatmydata + LD_PRELOAD=libeatmydata.so + MACHTYPE=i686-pc-linux-gnu + MAIL=/var/mail/root + OPTERR=1 + OPTIND=1 + OSTYPE=linux-gnu + PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path + PBCURRENTCOMMANDLINEOPERATION=build + PBUILDER_OPERATION=build + PBUILDER_PKGDATADIR=/usr/share/pbuilder + PBUILDER_PKGLIBDIR=/usr/lib/pbuilder + PBUILDER_SYSCONFDIR=/etc + PIPESTATUS=([0]="0") + POSIXLY_CORRECT=y + PPID=13949 PS4='+ ' - PWD='/' - SHELL='/bin/bash' - SHLVL='2' - SUDO_COMMAND='/usr/bin/timeout -k 18.1h 18h /usr/bin/ionice -c 3 /usr/bin/nice /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.r1NeHDgN/pbuilderrc_JNbE --distribution unstable --hookdir /etc/pbuilder/first-build-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/unstable-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.r1NeHDgN/b1 --logfile b1/build.log librsb_1.3.0.2+dfsg-7.dsc' - SUDO_GID='111' - SUDO_UID='104' - SUDO_USER='jenkins' - TERM='unknown' - TZ='/usr/share/zoneinfo/Etc/GMT+12' - USER='root' - _='/usr/bin/systemd-run' + PWD=/ + SHELL=/bin/bash + SHELLOPTS=braceexpand:errexit:hashall:interactive-comments:posix + SHLVL=3 + SUDO_COMMAND='/usr/bin/timeout -k 24.1h 24h /usr/bin/ionice -c 3 /usr/bin/nice -n 11 /usr/bin/unshare --uts -- /usr/sbin/pbuilder --build --configfile /srv/reproducible-results/rbuild-debian/r-b-build.r1NeHDgN/pbuilderrc_E7Aq --distribution unstable --hookdir /etc/pbuilder/rebuild-hooks --debbuildopts -b --basetgz /var/cache/pbuilder/unstable-reproducible-base.tgz --buildresult /srv/reproducible-results/rbuild-debian/r-b-build.r1NeHDgN/b2 --logfile b2/build.log librsb_1.3.0.2+dfsg-7.dsc' + SUDO_GID=111 + SUDO_UID=104 + SUDO_USER=jenkins + TERM=unknown + TZ=/usr/share/zoneinfo/Etc/GMT-14 + UID=0 + USER=root + _='I: set' I: uname -a - Linux infom08-i386 6.11.5+bpo-amd64 #1 SMP PREEMPT_DYNAMIC Debian 6.11.5-1~bpo12+1 (2024-11-11) x86_64 GNU/Linux + Linux i-capture-the-hostname 6.1.0-28-amd64 #1 SMP PREEMPT_DYNAMIC Debian 6.1.119-1 (2024-11-22) x86_64 GNU/Linux I: ls -l /bin - lrwxrwxrwx 1 root root 7 Nov 22 2024 /bin -> usr/bin -I: user script /srv/workspace/pbuilder/23139/tmp/hooks/D02_print_environment finished + lrwxrwxrwx 1 root root 7 Nov 22 14:40 /bin -> usr/bin +I: user script /srv/workspace/pbuilder/13949/tmp/hooks/D02_print_environment finished -> Attempting to satisfy build-dependencies -> Creating pbuilder-satisfydepends-dummy package Package: pbuilder-satisfydepends-dummy @@ -295,7 +327,7 @@ Get: 171 http://deb.debian.org/debian unstable/main i386 libltdl-dev i386 2.4.7-8 [167 kB] Get: 172 http://deb.debian.org/debian unstable/main i386 libhwloc-dev i386 2.11.2-1 [271 kB] Get: 173 http://deb.debian.org/debian unstable/main i386 zlib1g-dev i386 1:1.3.dfsg+really1.3.1-1+b1 [916 kB] -Fetched 385 MB in 7s (56.6 MB/s) +Fetched 385 MB in 6s (65.2 MB/s) debconf: delaying package configuration, since apt-utils is not installed Selecting previously unselected package liblocale-gettext-perl. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 19956 files and directories currently installed.) @@ -873,8 +905,8 @@ Setting up tzdata (2024b-3) ... Current default time zone: 'Etc/UTC' -Local time is now: Mon Jan 5 00:34:13 UTC 2026. -Universal Time is now: Mon Jan 5 00:34:13 UTC 2026. +Local time is now: Mon Dec 2 18:22:28 UTC 2024. +Universal Time is now: Mon Dec 2 18:22:28 UTC 2024. Run 'dpkg-reconfigure tzdata' if you wish to change it. Setting up libfontenc1:i386 (1:1.1.8-1+b1) ... @@ -1037,7 +1069,11 @@ Building tag database... -> Finished parsing the build-deps I: Building the package -I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" HOME="/nonexistent/first-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-7_source.changes +I: user script /srv/workspace/pbuilder/13949/tmp/hooks/A99_set_merged_usr starting +Not re-configuring usrmerge for unstable +I: user script /srv/workspace/pbuilder/13949/tmp/hooks/A99_set_merged_usr finished +hostname: Name or service not known +I: Running cd /build/reproducible-path/librsb-1.3.0.2+dfsg/ && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-buildpackage -us -uc -b && env PATH="/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" HOME="/nonexistent/second-build" dpkg-genchanges -S > ../librsb_1.3.0.2+dfsg-7_source.changes dpkg-buildpackage: info: source package librsb dpkg-buildpackage: info: source version 1.3.0.2+dfsg-7 dpkg-buildpackage: info: source distribution unstable @@ -1057,62 +1093,62 @@ dh binary dh_update_autotools_config dh_autoreconf -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found libtoolize: putting auxiliary files in '.'. libtoolize: copying file './ltmain.sh' libtoolize: putting macros in AC_CONFIG_MACRO_DIRS, 'm4'. @@ -1154,90 +1190,90 @@ libtoolize: copying file 'm4/ltsugar.m4' libtoolize: copying file 'm4/ltversion.m4' libtoolize: copying file 'm4/lt~obsolete.m4' -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found -sh: 1: git: not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found +sh: line 1: git: command not found configure.ac:66: installing './compile' configure.ac:65: installing './missing' Makefile.am: installing './depcomp' @@ -1420,7 +1456,7 @@ checking for m4... m4 checking for gmake... gmake checking for ggrep... /usr/bin/grep -checking for bash... /bin/bash +checking for bash... /bin/sh checking for gsed... /usr/bin/sed checking for cmp... cmp checking for basename... basename @@ -1537,7 +1573,7 @@ configure: It appears that Fortran programs can be linked without using the Fortran linker. configure: Using OPENMP_CFLAGS ok for linking an OpenMP program: adding it to LIBS. checking if your have a usable getrusage() ... 1 -checking for /bin/bash... /bin/bash +checking for /bin/sh... /bin/sh configure: Will not use Google Test. configure: You seem to not have GNU Octave or have disabled 'int' type. Part of the test suite will not be generated. If you want more testing capabilities, you should enable the 'int' type as well. checking that generated files are newer than configure... done @@ -1559,7 +1595,7 @@ config.status: executing depfiles commands config.status: executing libtool commands === configuring in librsbpp (/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=i686-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/i386-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=i686-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=i686-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/i386-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=i686-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether build environment is sane... yes checking for a race-free mkdir -p... /usr/bin/mkdir -p @@ -1681,7 +1717,7 @@ configure: Will not use Google Test. checking whether you have std::thread... yes checking whether you have std::mutex... yes -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1690,7 +1726,7 @@ config.status: executing libtool commands configure: Successfully created a Makefile. === configuring in rsblib (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=i686-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/i386-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=i686-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=i686-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/i386-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=i686-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether build environment is sane... yes checking for a race-free mkdir -p... /usr/bin/mkdir -p @@ -1799,7 +1835,7 @@ checking for filesystem... yes checking for main in -lstdc++fs... yes configure: Assuming you are yet to build librsb.la. (set LIBS= -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la) -/bin/bash +/bin/sh checking that generated files are newer than configure... done configure: creating ./config.status config.status: creating Makefile @@ -1809,7 +1845,7 @@ config.status: executing libtool commands configure: Created a Makefile. === configuring in rsbtest (/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest) -configure: running /bin/bash ./configure --disable-option-checking '--prefix=/usr' '--build=i686-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/i386-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=i686-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/bash' --cache-file=/dev/null --srcdir=. +configure: running /bin/sh ./configure --disable-option-checking '--prefix=/usr' '--build=i686-linux-gnu' '--includedir=${prefix}/include' '--mandir=${prefix}/share/man' '--infodir=${prefix}/share/info' '--sysconfdir=/etc' '--localstatedir=/var' '--disable-silent-rules' '--libdir=${prefix}/lib/i386-linux-gnu' '--runstatedir=/run' '--disable-maintainer-mode' '--disable-dependency-tracking' '--with-hwloc' '--enable-matrix-types=blas' '--with-zlib=-lz' '--enable-doc-build' '--enable-fortran-module-install' '--enable-extra-patches' '--enable-pkg-config-install' '--disable-extra-patches' 'build_alias=i686-linux-gnu' 'CFLAGS=-g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3' 'LDFLAGS=-Wl,-z,relro' 'CPPFLAGS=-Wdate-time -D_FORTIFY_SOURCE=2' 'FCFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe' 'CXXFLAGS=-g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security' 'BASH=/bin/sh' --cache-file=/dev/null --srcdir=. checking for a BSD-compatible install... /usr/bin/install -c checking whether build environment is sane... yes checking for a race-free mkdir -p... /usr/bin/mkdir -p @@ -1920,7 +1956,7 @@ checking for filesystem... yes checking for rsb_lib_init... no checking for dd... yes -/bin/bash +/bin/sh /usr/bin/timeout checking that generated files are newer than configure... done configure: creating ./config.status @@ -1952,7 +1988,7 @@ ARFLAGS : cru M4 : m4 MAKE : gmake - BASH : /bin/bash + BASH : /bin/sh OCTAVE : false DOXYGEN : doxygen HELP2MAN : help2man @@ -2001,30 +2037,30 @@ blhc: ignore-line-regexp: ^.*CC.*: gcc blhc: ignore-line-regexp: ^.*LD.*: /usr/bin/ld.* dh_auto_build - make -j6 + make -j5 make[2]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake all-recursive gmake[3]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' Making all in librsbpp gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp.o rsbpp.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp -/bin/bash ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_coo.lo rsbpp_coo.cpp +/bin/sh ./libtool --tag=CXX --mode=compile g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbpp_csr.lo rsbpp_csr.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c -o rsbtt.o rsbtt.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -c -o rsbct.o rsbct.c libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -fPIC -DPIC -o .libs/rsbpp_csr.o libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -fPIC -DPIC -o .libs/rsbpp_coo.o libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c rsbpp_coo.cpp -o rsbpp_coo.o >/dev/null 2>&1 libtool: compile: g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBPP_HAS_RSB_H=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -c rsbpp_csr.cpp -o rsbpp_csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o librsbpp.la rsbpp_coo.lo rsbpp_csr.lo -lpthread -lstdc++fs libtool: link: ar cr .libs/librsbpp.a .libs/rsbpp_coo.o .libs/rsbpp_csr.o libtool: link: ranlib .libs/librsbpp.a libtool: link: ( cd ".libs" && rm -f "librsbpp.la" && ln -s "../librsbpp.la" "librsbpp.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs -libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbpp rsbpp.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbpp rsbpp.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbtt rsbtt.o librsbpp.la -lpthread -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z,relro -o rsbct rsbct.o librsbpp.la -lpthread -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbct rsbct.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp +libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbpp rsbpp.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -DRSBPP_HAS_RSB_H=1 -Wl,-z -Wl,relro -o rsbtt rsbtt.o ./.libs/librsbpp.a -lpthread -lstdc++fs -fopenmp gmake all-am gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' @@ -2043,44 +2079,31 @@ gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsbench-rsb_libspblas_tests.o `test -f 'rsb_libspblas_tests.c' || echo './'`rsb_libspblas_tests.c g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -c -o rsb_dummy.o rsb_dummy.cpp gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o ch2icfb-ch2icfb.o `test -f 'ch2icfb.c' || echo './'`ch2icfb.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_stropts.lo `test -f 'rsb_stropts.c' || echo './'`rsb_stropts.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_stropts.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_stropts.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_stropts.c -o librsb_nounroll_la-rsb_stropts.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_strmif.lo `test -f 'rsb_strmif.c' || echo './'`rsb_strmif.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_unroll.lo `test -f 'rsb_unroll.c' || echo './'`rsb_unroll.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_strmif.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_strmif.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_unroll.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_unroll.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_unroll.c -o librsb_nounroll_la-rsb_unroll.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_vb.lo `test -f 'rsb_krnl_vb.c' || echo './'`rsb_krnl_vb.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_strmif.c -o librsb_nounroll_la-rsb_strmif.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_vb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_vb.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_lb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_lb.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_lb.lo `test -f 'rsb_krnl_lb.c' || echo './'`rsb_krnl_lb.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_vb.c -o librsb_nounroll_la-rsb_krnl_vb.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_strmif.c -o librsb_nounroll_la-rsb_strmif.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_lb.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_lb.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_lb.c -o librsb_nounroll_la-rsb_krnl_lb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl.lo `test -f 'rsb_krnl.c' || echo './'`rsb_krnl.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_bench.lo `test -f 'rsb_bench.c' || echo './'`rsb_bench.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bench.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_bench.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_mergesort.lo `test -f 'rsb_mergesort.c' || echo './'`rsb_mergesort.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mergesort.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_mergesort.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_permute.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_permute.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mergesort.c -o librsb_nounroll_la-rsb_mergesort.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_l.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_l.c -o librsb_nounroll_la-rsb_krnl_bcss_l.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_u.c -o librsb_nounroll_la-rsb_krnl_bcss_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_permute.lo `test -f 'rsb_permute.c' || echo './'`rsb_permute.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_permute.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_permute.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bench.c -o librsb_nounroll_la-rsb_bench.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_permute.c -o librsb_nounroll_la-rsb_permute.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o rsb_test_matops.c: In function 'rsb__main_block_partitioned_spmv_sxsa': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2099,9 +2122,19 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_permute.c -o librsb_nounroll_la-rsb_permute.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_l.lo `test -f 'rsb_krnl_bcss_l.c' || echo './'`rsb_krnl_bcss_l.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_l.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_l.c -o librsb_nounroll_la-rsb_krnl_bcss_l.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_u.lo `test -f 'rsb_krnl_bcss_u.c' || echo './'`rsb_krnl_bcss_u.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo `test -f 'rsb_krnl_bcss_spsv_u.c' || echo './'`rsb_krnl_bcss_spsv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_u.c -o librsb_nounroll_la-rsb_krnl_bcss_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo `test -f 'rsb_krnl_bcss_spmv_u.c' || echo './'`rsb_krnl_bcss_spmv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo `test -f 'rsb_krnl_bcss_misc_u.c' || echo './'`rsb_krnl_bcss_misc_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o rsb_test_matops.c: In function 'rsb__main_block_partitioned_spsv_sxsx': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2116,6 +2149,7 @@ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spsv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o >/dev/null 2>&1 rsb_test_matops.c: In function 'rsb__main_block_partitioned_mat_stats': rsb_test_matops.c:214:41: warning: '%s' directive writing up to 2047 bytes into a region of size 1011 [-Wformat-overflow=] 214 | rsb__sprintf(dst,"%s%s_%s_%.0lf_%s%s" "%s%s%s" "%s%s" "%s",pp?pp:"",h,rsb__getenv_nnr("HOSTNAME"),rsb_time(),buf,ap?ap:"", @@ -2131,215 +2165,217 @@ 32 | __va_arg_pack ()); | ~~~~~~~~~~~~~~~~~ libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl.c -o librsb_nounroll_la-rsb_krnl.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo `test -f 'rsb_krnl_bcoo_spmv_u.c' || echo './'`rsb_krnl_bcoo_spmv_u.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_krnl_bcss.lo `test -f 'rsb_krnl_bcss.c' || echo './'`rsb_krnl_bcss.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_krnl_bcss.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss.c -o librsb_nounroll_la-rsb_krnl_bcss.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spmv.lo `test -f 'rsb_spmv.c' || echo './'`rsb_spmv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spmv.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spmv.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_merge.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_merge.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spmv.c -o librsb_nounroll_la-rsb_spmv.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_merge.lo `test -f 'rsb_merge.c' || echo './'`rsb_merge.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_merge.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_merge.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_merge.c -o librsb_nounroll_la-rsb_merge.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_ompio.lo `test -f 'rsb_ompio.c' || echo './'`rsb_ompio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_ompio.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_ompio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_ompio.c -o librsb_nounroll_la-rsb_ompio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_util.lo `test -f 'rsb_util.c' || echo './'`rsb_util.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_util.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_util.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spgemm_csr.lo `test -f 'rsb_spgemm_csr.c' || echo './'`rsb_spgemm_csr.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm_csr.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spgemm_csr.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm_csr.c -o librsb_nounroll_la-rsb_spgemm_csr.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_misc_u.c -o librsb_nounroll_la-rsb_krnl_bcss_misc_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_spsum_misc.lo `test -f 'rsb_spsum_misc.c' || echo './'`rsb_spsum_misc.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum_misc.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_spsum_misc.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum_misc.c -o librsb_nounroll_la-rsb_spsum_misc.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_nounroll_la-rsb_prec.lo `test -f 'rsb_prec.c' || echo './'`rsb_prec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_prec.c -fPIC -DPIC -o .libs/librsb_nounroll_la-rsb_prec.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_prec.c -o librsb_nounroll_la-rsb_prec.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_is.lo `test -f 'rsb_is.c' || echo './'`rsb_is.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_is.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_is.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_is.c -o librsb_base_la-rsb_is.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mio.lo `test -f 'rsb_mio.c' || echo './'`rsb_mio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mio.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mio.c -o librsb_base_la-rsb_mio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_is.c -o librsb_base_la-rsb_is.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_op.lo `test -f 'rsb_op.c' || echo './'`rsb_op.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_op.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_op.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_op.c -o librsb_base_la-rsb_op.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_bio.lo `test -f 'rsb_bio.c' || echo './'`rsb_bio.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mio.c -o librsb_base_la-rsb_mio.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_bio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_bio.c -o librsb_base_la-rsb_bio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_get.lo `test -f 'rsb_get.c' || echo './'`rsb_get.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_get.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_get.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_get.c -o librsb_base_la-rsb_get.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_set.lo `test -f 'rsb_set.c' || echo './'`rsb_set.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_set.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_set.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_set.c -o librsb_base_la-rsb_set.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_get.c -o librsb_base_la-rsb_get.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo.lo `test -f 'rsb_coo.c' || echo './'`rsb_coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo.c -o librsb_base_la-rsb_coo.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_csr.lo `test -f 'rsb_csr.c' || echo './'`rsb_csr.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo_check.lo `test -f 'rsb_coo_check.c' || echo './'`rsb_coo_check.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_check.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_check.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_symm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_symm.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr.c -o librsb_base_la-rsb_csr.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_check.c -o librsb_base_la-rsb_coo_check.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_util.c -o librsb_nounroll_la-rsb_util.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_symm.c -o librsb_base_la-rsb_coo_symm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo_symm.lo `test -f 'rsb_coo_symm.c' || echo './'`rsb_coo_symm.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_idx.lo `test -f 'rsb_idx.c' || echo './'`rsb_idx.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_symm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo_symm.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_idx.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_idx.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srt.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo_symm.c -o librsb_base_la-rsb_coo_symm.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_srt.lo `test -f 'rsb_srt.c' || echo './'`rsb_srt.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_idx.c -o librsb_base_la-rsb_idx.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srt.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srt.c -o librsb_base_la-rsb_srt.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_srtp.lo `test -f 'rsb_srtp.c' || echo './'`rsb_srtp.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srtp.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_srtp.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_src.lo `test -f 'rsb_src.c' || echo './'`rsb_src.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srtp.c -o librsb_base_la-rsb_srtp.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_src.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_src.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_src.c -o librsb_base_la-rsb_src.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_srtp.c -o librsb_base_la-rsb_srtp.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_test_accuracy.lo `test -f 'rsb_test_accuracy.c' || echo './'`rsb_test_accuracy.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_test_accuracy.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_test_accuracy.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_clone.lo `test -f 'rsb_clone.c' || echo './'`rsb_clone.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_clone.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_clone.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_test_accuracy.c -o librsb_base_la-rsb_test_accuracy.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec.lo `test -f 'rsb_rec.c' || echo './'`rsb_rec.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_clone.c -o librsb_base_la-rsb_clone.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_render.lo `test -f 'rsb_render.c' || echo './'`rsb_render.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_render.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_render.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_render.c -o librsb_base_la-rsb_render.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec.c -o librsb_base_la-rsb_rec.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_eps.lo `test -f 'rsb_eps.c' || echo './'`rsb_eps.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_eps.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_eps.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_msort_up.lo `test -f 'rsb_msort_up.c' || echo './'`rsb_msort_up.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_msort_up.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_msort_up.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec.c -o librsb_base_la-rsb_rec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_msort_up.c -o librsb_base_la-rsb_msort_up.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_sys.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_sys.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_eps.c -o librsb_base_la-rsb_eps.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_sys.c -o librsb_base_la-rsb_sys.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_sys.lo `test -f 'rsb_sys.c' || echo './'`rsb_sys.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_sys.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_sys.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_blas_stuff.lo `test -f 'rsb_blas_stuff.c' || echo './'`rsb_blas_stuff.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_blas_stuff.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_blas_stuff.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_sys.c -o librsb_base_la-rsb_sys.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_blas_stuff.c -o librsb_base_la-rsb_blas_stuff.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_gen.lo `test -f 'rsb_gen.c' || echo './'`rsb_gen.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_gen.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_gen.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_perf.lo `test -f 'rsb_perf.c' || echo './'`rsb_perf.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_perf.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_perf.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rsb.lo `test -f 'rsb_rsb.c' || echo './'`rsb_rsb.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rsb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rsb.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_gen.c -o librsb_base_la-rsb_gen.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_perf.c -o librsb_base_la-rsb_perf.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_gen.c -o librsb_base_la-rsb_gen.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rsb.c -o librsb_base_la-rsb_rsb.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_err.lo `test -f 'rsb_err.c' || echo './'`rsb_err.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_err.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_err.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_tune.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_tune.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_tune.lo `test -f 'rsb_tune.c' || echo './'`rsb_tune.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_err.c -o librsb_base_la-rsb_err.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_do.lo `test -f 'rsb_do.c' || echo './'`rsb_do.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_tune.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_tune.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_do.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_do.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_internals.lo `test -f 'rsb_internals.c' || echo './'`rsb_internals.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_internals.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_internals.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_do.c -o librsb_base_la-rsb_do.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_garbage.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_garbage.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_garbage.lo `test -f 'rsb_garbage.c' || echo './'`rsb_garbage.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_internals.c -o librsb_base_la-rsb_internals.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_garbage.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_garbage.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_garbage.c -o librsb_base_la-rsb_garbage.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_tune.c -o librsb_base_la-rsb_tune.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mmio.lo `test -f 'rsb_mmio.c' || echo './'`rsb_mmio.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mmio.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mmio.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mmio.c -o librsb_base_la-rsb_mmio.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_partition.lo `test -f 'rsb_partition.c' || echo './'`rsb_partition.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_partition.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_partition.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_partition.c -o librsb_base_la-rsb_partition.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_mbw.lo `test -f 'rsb_mbw.c' || echo './'`rsb_mbw.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_limiter.lo `test -f 'rsb_limiter.c' || echo './'`rsb_limiter.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mbw.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_mbw.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_limiter.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_limiter.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_partition.c -o librsb_base_la-rsb_partition.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_limiter.c -o librsb_base_la-rsb_limiter.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_fpb.lo `test -f 'rsb_fpb.c' || echo './'`rsb_fpb.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_fpb.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_fpb.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spgemm.lo `test -f 'rsb_spgemm.c' || echo './'`rsb_spgemm.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spgemm.o libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_fpb.c -o librsb_base_la-rsb_fpb.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_mbw.c -o librsb_base_la-rsb_mbw.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spgemm.c -o librsb_base_la-rsb_spgemm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spsum.lo `test -f 'rsb_spsum.c' || echo './'`rsb_spsum.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsum.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum.c -o librsb_base_la-rsb_spsum.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_spsv.lo `test -f 'rsb_spsv.c' || echo './'`rsb_spsv.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_lock.lo `test -f 'rsb_lock.c' || echo './'`rsb_lock.c -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_spsv.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsum.c -o librsb_base_la-rsb_spsum.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_lock.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_lock.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_swt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_swt.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_init.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_init.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_swt.lo `test -f 'rsb_swt.c' || echo './'`rsb_swt.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_lock.c -o librsb_base_la-rsb_lock.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_swt.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_swt.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_init.lo `test -f 'rsb_init.c' || echo './'`rsb_init.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsv.c -o librsb_base_la-rsb_spsv.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_swt.c -o librsb_base_la-rsb_swt.o >/dev/null 2>&1 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_init.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_init.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_init.c -o librsb_base_la-rsb_init.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_spsv.c -o librsb_base_la-rsb_spsv.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_dump.lo `test -f 'rsb_dump.c' || echo './'`rsb_dump.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_dump.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_dump.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_cpmv.lo `test -f 'rsb_cpmv.c' || echo './'`rsb_cpmv.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_cpmv.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_cpmv.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_asm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_asm.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_asm.lo `test -f 'rsb_asm.c' || echo './'`rsb_asm.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_cpmv.c -o librsb_base_la-rsb_cpmv.o >/dev/null 2>&1 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_user.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_user.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_asm.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_asm.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_dump.c -o librsb_base_la-rsb_dump.o >/dev/null 2>&1 +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_user.lo `test -f 'rsb_user.c' || echo './'`rsb_user.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_asm.c -o librsb_base_la-rsb_asm.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_user.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_user.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_coo2rec.lo `test -f 'rsb_coo2rec.c' || echo './'`rsb_coo2rec.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo2rec.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_coo2rec.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec2coo.lo `test -f 'rsb_rec2coo.c' || echo './'`rsb_rec2coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_user.c -o librsb_base_la-rsb_user.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2coo.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2csr.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_rec2csr.lo `test -f 'rsb_rec2csr.c' || echo './'`rsb_rec2csr.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2coo.c -o librsb_base_la-rsb_rec2coo.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2csr.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_rec2csr.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o librsb_base_la-rsb_csr2coo.lo `test -f 'rsb_csr2coo.c' || echo './'`rsb_csr2coo.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_rec2csr.c -o librsb_base_la-rsb_rec2csr.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o rsb_blas_sparse.lo rsb_blas_sparse.F90 +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr2coo.c -fPIC -DPIC -o .libs/librsb_base_la-rsb_csr2coo.o +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_csr2coo.c -o librsb_base_la-rsb_csr2coo.o >/dev/null 2>&1 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c rsb_blas_sparse.F90 -fPIC -o .libs/rsb_blas_sparse.o +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsb_libspblas_handle.lo rsb_libspblas_handle.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas_handle.c -fPIC -DPIC -o .libs/rsb_libspblas_handle.o -/bin/bash ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c +/bin/sh ./libtool --tag=CC --mode=compile gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c -o rsb_libspblas.lo rsb_libspblas.c libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas.c -fPIC -DPIC -o .libs/rsb_libspblas.o -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_coo2rec.c -o librsb_base_la-rsb_coo2rec.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas_handle.c -o rsb_libspblas_handle.o >/dev/null 2>&1 -gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o rsb_blas_sparse.o rsb_blas_sparse.F90 -libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas.c -o rsb_libspblas.o >/dev/null 2>&1 libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c rsb_blas_sparse.F90 -o rsb_blas_sparse.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_libspblas.c -o rsb_libspblas.o >/dev/null 2>&1 +gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o rsb_blas_sparse.o rsb_blas_sparse.F90 +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o ch2icfb ch2icfb-ch2icfb.o -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: warning: '-version-info' is ignored for programs libtool: link: gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -Wl,-z -Wl,relro -o ch2icfb ch2icfb-ch2icfb.o -fopenmp -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath if test -f ./rsb_types.h -a ! -f ./rsb_types.h ; then cp -pv ./rsb_types.h ./rsb_types.h ; fi # out-of-dir behaviour varies between installations -if test -f ch2icfb ; then if SED=/usr/bin/sed GREP=/usr/bin/grep /bin/bash ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi -/bin/bash ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o rsb.lo rsb.F90 -libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c rsb.F90 -fPIC -o .libs/rsb.o -libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c rsb.F90 -o rsb.o >/dev/null 2>&1 +if test -f ch2icfb ; then if SED=/usr/bin/sed GREP=/usr/bin/grep /bin/sh ./scripts/rsb_h_to_rsb_fi.sh . /build/reproducible-path/librsb-1.3.0.2+dfsg > rsb.F90 ; then true; else rm "rsb.F90"; echo "Failure generating rsb.F90!" ; exit ; fi ; else echo "Warning: Your system did not build ch2icfb for some reason --- skipping rebuild of "rsb.F90 ;true ; fi +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o rsb.o rsb.F90 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_spblas.la rsb_libspblas_handle.lo rsb_libspblas.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ./libtool --tag=FC --mode=compile gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o rsb.lo rsb.F90 libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_spblas.a .libs/rsb_libspblas_handle.o .libs/rsb_libspblas.o libtool: link: ranlib .libs/librsb_spblas.a libtool: link: ( cd ".libs" && rm -f "librsb_spblas.la" && ln -s "../librsb_spblas.la" "librsb_spblas.la" ) -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_base.la librsb_base_la-rsb_is.lo librsb_base_la-rsb_mio.lo librsb_base_la-rsb_op.lo librsb_base_la-rsb_bio.lo librsb_base_la-rsb_get.lo librsb_base_la-rsb_set.lo librsb_base_la-rsb_coo.lo librsb_base_la-rsb_csr.lo librsb_base_la-rsb_coo_check.lo librsb_base_la-rsb_coo_symm.lo librsb_base_la-rsb_idx.lo librsb_base_la-rsb_srt.lo librsb_base_la-rsb_srtp.lo librsb_base_la-rsb_src.lo librsb_base_la-rsb_test_accuracy.lo librsb_base_la-rsb_clone.lo librsb_base_la-rsb_rec.lo librsb_base_la-rsb_render.lo librsb_base_la-rsb_eps.lo librsb_base_la-rsb_msort_up.lo librsb_base_la-rsb_sys.lo librsb_base_la-rsb_blas_stuff.lo librsb_base_la-rsb_gen.lo librsb_base_la-rsb_perf.lo librsb_base_la-rsb_rsb.lo librsb_base_la-rsb_err.lo librsb_base_la-rsb_tune.lo librsb_base_la-rsb_do.lo librsb_base_la-rsb_internals.lo librsb_base_la-rsb_garbage.lo librsb_base_la-rsb_mmio.lo librsb_base_la-rsb_partition.lo librsb_base_la-rsb_mbw.lo librsb_base_la-rsb_limiter.lo librsb_base_la-rsb_fpb.lo librsb_base_la-rsb_spgemm.lo librsb_base_la-rsb_spsum.lo librsb_base_la-rsb_spsv.lo librsb_base_la-rsb_lock.lo librsb_base_la-rsb_swt.lo librsb_base_la-rsb_init.lo librsb_base_la-rsb_dump.lo librsb_base_la-rsb_cpmv.lo librsb_base_la-rsb_asm.lo librsb_base_la-rsb_user.lo librsb_base_la-rsb_coo2rec.lo librsb_base_la-rsb_rec2coo.lo librsb_base_la-rsb_rec2csr.lo librsb_base_la-rsb_csr2coo.lo rsb_blas_sparse.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c rsb.F90 -fPIC -o .libs/rsb.o +libtool: compile: gfortran -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c rsb.F90 -o rsb.o >/dev/null 2>&1 libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_base.a .libs/librsb_base_la-rsb_is.o .libs/librsb_base_la-rsb_mio.o .libs/librsb_base_la-rsb_op.o .libs/librsb_base_la-rsb_bio.o .libs/librsb_base_la-rsb_get.o .libs/librsb_base_la-rsb_set.o .libs/librsb_base_la-rsb_coo.o .libs/librsb_base_la-rsb_csr.o .libs/librsb_base_la-rsb_coo_check.o .libs/librsb_base_la-rsb_coo_symm.o .libs/librsb_base_la-rsb_idx.o .libs/librsb_base_la-rsb_srt.o .libs/librsb_base_la-rsb_srtp.o .libs/librsb_base_la-rsb_src.o .libs/librsb_base_la-rsb_test_accuracy.o .libs/librsb_base_la-rsb_clone.o .libs/librsb_base_la-rsb_rec.o .libs/librsb_base_la-rsb_render.o .libs/librsb_base_la-rsb_eps.o .libs/librsb_base_la-rsb_msort_up.o .libs/librsb_base_la-rsb_sys.o .libs/librsb_base_la-rsb_blas_stuff.o .libs/librsb_base_la-rsb_gen.o .libs/librsb_base_la-rsb_perf.o .libs/librsb_base_la-rsb_rsb.o .libs/librsb_base_la-rsb_err.o .libs/librsb_base_la-rsb_tune.o .libs/librsb_base_la-rsb_do.o .libs/librsb_base_la-rsb_internals.o .libs/librsb_base_la-rsb_garbage.o .libs/librsb_base_la-rsb_mmio.o .libs/librsb_base_la-rsb_partition.o .libs/librsb_base_la-rsb_mbw.o .libs/librsb_base_la-rsb_limiter.o .libs/librsb_base_la-rsb_fpb.o .libs/librsb_base_la-rsb_spgemm.o .libs/librsb_base_la-rsb_spsum.o .libs/librsb_base_la-rsb_spsv.o .libs/librsb_base_la-rsb_lock.o .libs/librsb_base_la-rsb_swt.o .libs/librsb_base_la-rsb_init.o .libs/librsb_base_la-rsb_dump.o .libs/librsb_base_la-rsb_cpmv.o .libs/librsb_base_la-rsb_asm.o .libs/librsb_base_la-rsb_user.o .libs/librsb_base_la-rsb_coo2rec.o .libs/librsb_base_la-rsb_rec2coo.o .libs/librsb_base_la-rsb_rec2csr.o .libs/librsb_base_la-rsb_csr2coo.o .libs/rsb_blas_sparse.o libtool: link: ranlib .libs/librsb_base.a libtool: link: ( cd ".libs" && rm -f "librsb_base.la" && ln -s "../librsb_base.la" "librsb_base.la" ) libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcss_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o >/dev/null 2>&1 libtool: compile: gcc -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -fno-unroll-loops -fopenmp -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -c rsb_krnl_bcoo_spmv_u.c -o librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o >/dev/null 2>&1 -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb_nounroll.la librsb_nounroll_la-rsb_stropts.lo librsb_nounroll_la-rsb_strmif.lo librsb_nounroll_la-rsb_unroll.lo librsb_nounroll_la-rsb_krnl_vb.lo librsb_nounroll_la-rsb_krnl_lb.lo librsb_nounroll_la-rsb_krnl.lo librsb_nounroll_la-rsb_bench.lo librsb_nounroll_la-rsb_mergesort.lo librsb_nounroll_la-rsb_permute.lo librsb_nounroll_la-rsb_krnl_bcss_l.lo librsb_nounroll_la-rsb_krnl_bcss_u.lo librsb_nounroll_la-rsb_krnl_bcss_spsv_u.lo librsb_nounroll_la-rsb_krnl_bcss_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss_misc_u.lo librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.lo librsb_nounroll_la-rsb_krnl_bcss.lo librsb_nounroll_la-rsb_spmv.lo librsb_nounroll_la-rsb_merge.lo librsb_nounroll_la-rsb_ompio.lo librsb_nounroll_la-rsb_util.lo librsb_nounroll_la-rsb_spgemm_csr.lo librsb_nounroll_la-rsb_spsum_misc.lo librsb_nounroll_la-rsb_prec.lo -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: warning: '-version-info/-version-number' is ignored for convenience libraries libtool: link: ar cr .libs/librsb_nounroll.a .libs/librsb_nounroll_la-rsb_stropts.o .libs/librsb_nounroll_la-rsb_strmif.o .libs/librsb_nounroll_la-rsb_unroll.o .libs/librsb_nounroll_la-rsb_krnl_vb.o .libs/librsb_nounroll_la-rsb_krnl_lb.o .libs/librsb_nounroll_la-rsb_krnl.o .libs/librsb_nounroll_la-rsb_bench.o .libs/librsb_nounroll_la-rsb_mergesort.o .libs/librsb_nounroll_la-rsb_permute.o .libs/librsb_nounroll_la-rsb_krnl_bcss_l.o .libs/librsb_nounroll_la-rsb_krnl_bcss_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spsv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss_misc_u.o .libs/librsb_nounroll_la-rsb_krnl_bcoo_spmv_u.o .libs/librsb_nounroll_la-rsb_krnl_bcss.o .libs/librsb_nounroll_la-rsb_spmv.o .libs/librsb_nounroll_la-rsb_merge.o .libs/librsb_nounroll_la-rsb_ompio.o .libs/librsb_nounroll_la-rsb_util.o .libs/librsb_nounroll_la-rsb_spgemm_csr.o .libs/librsb_nounroll_la-rsb_spsum_misc.o .libs/librsb_nounroll_la-rsb_prec.o libtool: link: ranlib .libs/librsb_nounroll.a libtool: link: ( cd ".libs" && rm -f "librsb_nounroll.la" && ln -s "../librsb_nounroll.la" "librsb_nounroll.la" ) -/bin/bash ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/i386-linux-gnu rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ./libtool --tag=CC --mode=link gcc -g -O2 -Werror=implicit-function-declaration -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -no-undefined -version-info 0:0:0 -Wl,-z,relro -o librsb.la -rpath /usr/lib/i386-linux-gnu rsb.lo librsb_nounroll.la librsb_base.la librsb_spblas.la /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/librsbpp.la -lstdc++ -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: link: gcc -shared -fPIC -DPIC .libs/rsb.o -Wl,--whole-archive ./.libs/librsb_nounroll.a ./.libs/librsb_base.a ./.libs/librsb_spblas.a /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/.libs/librsbpp.a -Wl,--no-whole-archive -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lpthread -lstdc++fs -lstdc++ -lhwloc -lz -lgfortran -lm -lquadmath -g -O2 -fstack-protector-strong -O3 -Wl,-z -Wl,relro -fopenmp -fopenmp -Wl,-soname -Wl,librsb.so.0 -o .libs/librsb.so.0.0.0 libtool: link: (cd ".libs" && rm -f "librsb.so.0" && ln -s "librsb.so.0.0.0" "librsb.so.0") libtool: link: (cd ".libs" && rm -f "librsb.so" && ln -s "librsb.so.0.0.0" "librsb.so") @@ -2351,7 +2387,7 @@ libtool: link: ranlib .libs/librsb.a libtool: link: rm -fr .libs/librsb.lax libtool: link: ( cd ".libs" && rm -f "librsb.la" && ln -s "../librsb.la" "librsb.la" ) -/bin/bash ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ./libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -no-undefined -version-info 0:0:0 -Wl,-z,relro -o rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: warning: '-version-info' is ignored for programs libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/rsbench rsbench-rsbench.o rsbench-rsb_test_matops.o rsbench-rsb_mkl.o rsbench-rsb_genmm.o rsbench-rsb_mmls.o rsbench-rsb_pr.o rsbench-rsb_pcnt.o rsbench-rsb_failure_tests.o rsbench-rsb_libspblas_tests.o rsb_dummy.o -fopenmp ./.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -2368,28 +2404,28 @@ gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o fortran.o fortran.F90 gfortran -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -I.. -I.. -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -pipe -fopenmp -c -o fortran_rsb_fi.o fortran_rsb_fi.F90 g++ -DHAVE_CONFIG_H -I. -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp -I/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -c -o cplusplus.o cplusplus.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o hello hello.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o transpose transpose.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o power power.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/hello hello.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o autotune autotune.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o backsolve backsolve.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/power power.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/transpose transpose.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o hello-spblas hello-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/autotune autotune.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o io-spblas io-spblas.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o fortran fortran.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/backsolve backsolve.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o fortran_rsb_fi fortran_rsb_fi.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/hello-spblas hello-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/io-spblas io-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/fortran fortran.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o cplusplus cplusplus.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/hello-spblas hello-spblas.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp +/bin/sh ../libtool --tag=CXX --mode=link g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z,relro -o snippets snippets.o -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lhwloc -lm -lhwloc -lz -fopenmp -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/fortran_rsb_fi fortran_rsb_fi.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp -libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/snippets snippets.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/fortran fortran.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/cplusplus cplusplus.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp +libtool: link: g++ -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -fopenmp -Wl,-z -Wl,relro -o .libs/snippets snippets.o -fopenmp -L.. /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lhwloc -lz -L/usr/lib/gcc/i686-linux-gnu/14 -L/usr/lib/gcc/i686-linux-gnu/14/../../../i386-linux-gnu -L/usr/lib/gcc/i686-linux-gnu/14/../../../../lib -L/lib/i386-linux-gnu -L/lib/../lib -L/usr/lib/i386-linux-gnu -L/usr/lib/../lib -L/usr/lib/gcc/i686-linux-gnu/14/../../.. -lgfortran -lm -lquadmath -fopenmp gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' Making all in scripts gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/scripts' @@ -2406,12 +2442,12 @@ Making all in doc gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/doc' /usr/bin/mkdir -p man +SOURCE_DATE_EPOCH=1704020461 \ +help2man --name="benchmark and test for librsb" --no-info ../rsbench | /usr/bin/sed 's/January //g' > man/rsbench.1 /usr/bin/mkdir -p man -gmake makedox -SOURCE_DATE_EPOCH=1767272461 \ +SOURCE_DATE_EPOCH=1704020461 \ help2man --name="provide configuration information for librsb" --no-info /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb-config | /usr/bin/sed 's/January //g' > man/librsb-config.1 -SOURCE_DATE_EPOCH=1767272461 \ -help2man --name="benchmark and test for librsb" --no-info ../rsbench | /usr/bin/sed 's/January //g' > man/rsbench.1 +gmake makedox gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/doc' DOXYGEN_PROJECT_NUMBER=1.3.0.2 doxygen Doxyfile || echo "are you sure you have doxygen installed ?" warning: Tag 'HTML_TIMESTAMP' at line 1513 of file 'Doxyfile' has become obsolete. @@ -3122,13 +3158,13 @@ g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o rgt-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o rgt_ne-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp g++ -DHAVE_CONFIG_H -I. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o rgt_rv-rgt.o `test -f 'rgt.cpp' || echo './'`rgt.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -DRSBP_NOTHROW=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rgt_ne rgt_ne-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rgt rgt-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -DRSBP_NOTHROW=1 -DRSBP_WANT_REV=1 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rgt_rv rgt_rv-rgt.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rsb rsb.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' Making all in examples @@ -3143,26 +3179,26 @@ g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o mtx2bin.o mtx2bin.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o render.o render.cpp g++ -DHAVE_CONFIG_H -I.. -Wdate-time -D_FORTIFY_SOURCE=2 -I/build/reproducible-path/librsb-1.3.0.2+dfsg -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o span.o span.cpp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/assemble assemble.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/build build.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/misc misc.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/twonnz twonnz.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/example example.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/render render.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la +/bin/sh ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/span span.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/autotune autotune.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -/bin/bash ../libtool --tag=CXX --mode=link g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/bench bench.o -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp +libtool: link: g++ -I.. -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/mtx2bin mtx2bin.o -lstdc++fs -lpthread /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -fopenmp gmake[6]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib/examples' gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsblib' @@ -3171,7 +3207,7 @@ gmake all-am gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' g++ -DHAVE_CONFIG_H -I. -I/build/reproducible-path/librsb-1.3.0.2+dfsg -Wdate-time -D_FORTIFY_SOURCE=2 -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -c -o rsbtest.o rsbtest.cpp -/bin/bash ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs +/bin/sh ./libtool --tag=CXX --mode=link g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z,relro -o rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/librsb.la -lstdc++fs -lstdc++fs libtool: link: g++ -fopenmp -g -O2 -ffile-prefix-map=/build/reproducible-path/librsb-1.3.0.2+dfsg=. -fstack-protector-strong -Wformat -Werror=format-security -Wl,-z -Wl,relro -o .libs/rsbtest rsbtest.o /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/librsb.so -lstdc++fs -fopenmp gmake[5]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest' @@ -3247,7 +3283,7 @@ gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake mtests -C . gmake[3]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash -ex ./scripts/readme-tests.sh +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh -ex ./scripts/readme-tests.sh + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x + ./rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # --bench option implies -qH -R --write-performance-record --want-mkl-autotune --mkl-benchmark --types : --split-experimental 6 --merge-experimental 6 --also-transpose --sort-filenames-list --want-memory-benchmark @@ -3257,15 +3293,15 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1767573701 +# beginning run at 1733165242 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx -qH -R -n1,4 -T z --verbose --nrhs 1,2 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -# average timer granularity: 5.05e-08 s -# Will write a final performance record to file rsbench_pr__1767573701_gcc-14.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1767573701_gcc-14.2-1,4th.rpr.tmp +# average timer granularity: 5.6e-08 s +# Will write a final performance record to file rsbench_pr__1733165242_gcc-14.2-1,4th.rpr and periodic checkpoints to rsbench_pr__1733165242_gcc-14.2-1,4th.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs:/usr/lib/libeatmydata # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -3304,61 +3340,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: infom08-i386 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 3 cache levels detected Will fill struct with 50 samples... -# Memory benchmark took 8.275s +# Memory benchmark took 11.170s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 8 samples (2016 bytes). # Cache block size total 16777216 bytes, per-thread 2097152 bytes -# so far, program took 8.278s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 11.172s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type Z... -# file input of A.mtx took 0.00 s (6 nnz, 56680 nnz/s ) (1.74 MB/s ) -#pre-sorting (6 elements) took 0.000663042 s -#weeding duplicates (to 6 elements) took 9.53674e-07 s (and check, 2.14577e-06 s ) +# file input of A.mtx took 0.00 s (6 nnz, 79892 nnz/s ) (2.45 MB/s ) +#pre-sorting (6 elements) took 0.0368609 s +#weeding duplicates (to 6 elements) took 1.90735e-06 s (and check, 9.53674e-07 s ) # multi-nrhs benchmarking (1,2) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x56a7afc0]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.124s): (3 x 3)[0x57747000]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 4.411e-05s; avg 1.47e-05s ( +/- 59.46/104.32 %); best 5.96e-06s; worst 3.004e-05s; std dev. 1.088e-05 (taking best). -Reference operation time is 5.96046e-06 s (16.11 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 5.96e-06 Mflops: 16.106) -Merge (3 -> 1 leaves) took w.c.t. of 1.097e-05s, ~4.053e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) -3 iterations (1 th.) took 1.907e-05s; avg 6.358e-06s ( +/- 99.17/200.00 %); best 5.27e-08s; worst 1.907e-05s; std dev. 8.991e-06 (taking best). -Reference operation time is 5.27024e-08 s (1822 Mflops) with 1 threads. -After merge step 1: tpop: 5.27e-08 s ~Mflops: 1821.548 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 113.097x: 5.96e-06s -> 5.27e-08s, so taking this instance. +3 iterations (1 th.) took 0.07201s; avg 0.024s ( +/- 0.06/ 0.03 %); best 0.02399s; worst 0.02401s; std dev. 9.425e-06 (taking best). +Reference operation time is 0.0239911 s (0.004001 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.02399 Mflops: 0.004) +Merge (3 -> 1 leaves) took w.c.t. of 2.599e-05s, ~8.106e-06s of computing time (of which 1.192e-06s sorting, 4.053e-06s analysis) +3 iterations (1 th.) took 2.503e-05s; avg 8.345e-06s ( +/- 99.36/185.71 %); best 5.33e-08s; worst 2.384e-05s; std dev. 1.097e-05 (taking best). +Reference operation time is 5.32985e-08 s (1801 Mflops) with 1 threads. +After merge step 1: tpop: 5.33e-08 s ~Mflops: 1801.177 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 450127.488x: 0.02399s -> 5.33e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 6.104e-05s (of which 1.407e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 0s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 6.104e-05s, equivalent to 1158.1/10.2 new/old ops (4.387e-05s for 2 clones -- as 832.4/7.4 ops, or 416.2/3.7 ops per clone), SPEEDUP of 113.097x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 113.097x (5.96e-06s -> 5.27e-08s), will amortize in 10.3 ops by saving 5.908e-06s per op. -In 1 tuning rounds (tot. 0.00015s, 4.4e-05s for constructor, 2 clones) obtained a SPEEDUP of 11209.7% (113.1x) (from 16.11 to 1822 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.06398s (of which 2.885e-05s partitioning, 0s I/O); computing times: 8.106e-06s in par. loops, 1.192e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.06398s, equivalent to 1200425.0/2.7 new/old ops (0.1238s for 2 clones -- as 2323386.3/5.2 ops, or 1161693.1/2.6 ops per clone), SPEEDUP of 450127.488x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 450127.488x (0.02399s -> 5.33e-08s), will amortize in 2.7 ops by saving 0.02399s per op. +In 1 tuning rounds (tot. 0.2s, 0.12s for constructor, 2 clones) obtained a SPEEDUP of 45012648.8% (4.501e+05x) (from 0.004001 to 1801 Mflops). #pr: updating sample at index 1 (0^th of 8), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.000188828 s (5.960e-06 s -> 5.270e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.195997 s (2.399e-02 s -> 5.330e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000944138 s and estimated a speedup of 1.000000 x (5.270e-08 s -> 5.270e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.24796 s and estimated a speedup of 1.000000 x (5.330e-08 s -> 5.330e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.000023 0.000021 0.000044 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.000044 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.000023 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.000021 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.035909 0.040002 0.075911 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.075911 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.035909 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.040002 %:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.000044 +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.075911 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 @@ -3373,47 +3409,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x56a7e700]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.148s): (3 x 3)[0x5774a740]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 3.195e-05s; avg 1.065e-05s ( +/- 35.07/ 70.15 %); best 6.914e-06s; worst 1.812e-05s; std dev. 5.282e-06 (taking best). -Reference operation time is 6.91414e-06 s (13.88 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 6.914e-06 Mflops: 13.885) -Merge (3 -> 1 leaves) took w.c.t. of 2.217e-05s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) -3 iterations (4 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 94.90/ 84.62 %); best 5.27e-08s; worst 1.907e-06s; std dev. 7.867e-07 (taking best). -Reference operation time is 5.27024e-08 s (1822 Mflops) with 4 threads. -After merge step 1: tpop: 5.27e-08 s ~Mflops: 1821.548 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 131.192x: 6.914e-06s -> 5.27e-08s, so taking this instance. +3 iterations (4 th.) took 0.07601s; avg 0.02534s ( +/- 52.57/ 65.11 %); best 0.01202s; worst 0.04183s; std dev. 0.01238 (taking best). +Reference operation time is 0.0120161 s (0.007989 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.01202 Mflops: 0.008) +Merge (3 -> 1 leaves) took w.c.t. of 1.502e-05s, ~4.768e-06s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) +3 iterations (4 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 94.84/200.00 %); best 5.33e-08s; worst 3.099e-06s; std dev. 1.461e-06 (taking best). +Reference operation time is 5.32985e-08 s (1801 Mflops) with 4 threads. +After merge step 1: tpop: 5.33e-08 s ~Mflops: 1801.177 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 225448.446x: 0.01202s -> 5.33e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 5.198e-05s (of which 2.313e-05s partitioning, 0s I/O); computing times: 1.907e-06s in par. loops, 9.537e-07s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 5.198e-05s, equivalent to 986.2/7.5 new/old ops (3.886e-05s for 2 clones -- as 737.4/5.6 ops, or 368.7/2.8 ops per clone), SPEEDUP of 131.192x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 131.192x (6.914e-06s -> 5.27e-08s), will amortize in 7.6 ops by saving 6.861e-06s per op. -In 1 tuning rounds (tot. 0.00013s, 3.9e-05s for constructor, 2 clones) obtained a SPEEDUP of 13019.2% (131.2x) (from 13.88 to 1822 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.07198s (of which 1.907e-05s partitioning, 0s I/O); computing times: 4.768e-06s in par. loops, 1.907e-06s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.07198s, equivalent to 1350489.8/6.0 new/old ops (0.1559s for 2 clones -- as 2924831.1/13.0 ops, or 1462415.6/6.5 ops per clone), SPEEDUP of 225448.446x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 225448.446x (0.01202s -> 5.33e-08s), will amortize in 6.0 ops by saving 0.01202s per op. +In 1 tuning rounds (tot. 0.23s, 0.16s for constructor, 2 clones) obtained a SPEEDUP of 22544744.6% (2.254e+05x) (from 0.007989 to 1801 Mflops). #pr: updating sample at index 5 (1^th of 8), 0^th touch for (0,1,0,0,0,0,0). -First run of RSB Autotuner took 0.000135183 s (6.914e-06 s -> 5.270e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.231992 s (1.202e-02 s -> 5.330e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000363827 s and estimated a speedup of 1.000000 x (5.270e-08 s -> 5.270e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.18396 s and estimated a speedup of 1.000000 x (5.330e-08 s -> 5.330e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.000024 0.000349 0.000373 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.000373 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.000024 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.000349 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.039739 0.076020 0.115759 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.115759 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.039739 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.076020 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.000373 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.115759 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.12 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.12 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.97 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.06 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 -nan 0.97 0.06 0.12 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.66 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.66 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.90 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.53 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 -nan 0.90 0.53 0.66 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -3422,50 +3458,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 7.08103e-05 1e+09 1e+09 +%operation:A.mtx 0.123905 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 0 2.31266e-05 0 2.09808e-05 +%constructor:A.mtx 0 0.0359089 0 0.0400021 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,2) -- now using nrhs 2. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x56a7e700]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.129s): (3 x 3)[0x5774a740]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (1 th.) took 3.695e-05s; avg 1.232e-05s ( +/- 59.35/ 95.48 %); best 5.007e-06s; worst 2.408e-05s; std dev. 8.399e-06 (taking best). -Reference operation time is 5.00679e-06 s (38.35 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 5.007e-06 Mflops: 38.348) -Merge (3 -> 1 leaves) took w.c.t. of 7.153e-06s, ~2.861e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) -3 iterations (1 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 94.47/200.00 %); best 5.27e-08s; worst 2.861e-06s; std dev. 1.349e-06 (taking best). -Reference operation time is 5.27024e-08 s (3643 Mflops) with 1 threads. -After merge step 1: tpop: 5.27e-08 s ~Mflops: 3643.096 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 95.001x: 5.007e-06s -> 5.27e-08s, so taking this instance. +3 iterations (1 th.) took 0.06001s; avg 0.02s ( +/- 39.96/ 20.01 %); best 0.01201s; worst 0.02401s; std dev. 0.005653 (taking best). +Reference operation time is 0.0120101 s (0.01599 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.01201 Mflops: 0.016) +Merge (3 -> 1 leaves) took w.c.t. of 1.597e-05s, ~5.007e-06s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) +3 iterations (1 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 96.05/111.76 %); best 5.33e-08s; worst 2.861e-06s; std dev. 1.173e-06 (taking best). +Reference operation time is 5.32985e-08 s (3602 Mflops) with 1 threads. +After merge step 1: tpop: 5.33e-08 s ~Mflops: 3602.355 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 225336.614x: 0.01201s -> 5.33e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 3.695e-05s (of which 9.06e-06s partitioning, 0s I/O); computing times: 2.861e-06s in par. loops, 0s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 3.695e-05s, equivalent to 701.2/7.4 new/old ops (3.719e-05s for 2 clones -- as 705.7/7.4 ops, or 352.9/3.7 ops per clone), SPEEDUP of 95.001x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 95.001x (5.007e-06s -> 5.27e-08s), will amortize in 7.5 ops by saving 4.954e-06s per op. -In 1 tuning rounds (tot. 0.00011s, 3.7e-05s for constructor, 2 clones) obtained a SPEEDUP of 9400.1% (95x) (from 38.35 to 3643 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.05998s (of which 1.788e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 1.907e-06s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.05998s, equivalent to 1125359.0/5.0 new/old ops (0.1399s for 2 clones -- as 2624388.3/11.6 ops, or 1312194.1/5.8 ops per clone), SPEEDUP of 225336.614x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 225336.614x (0.01201s -> 5.33e-08s), will amortize in 5.0 ops by saving 0.01201s per op. +In 1 tuning rounds (tot. 0.2s, 0.14s for constructor, 2 clones) obtained a SPEEDUP of 22533561.4% (2.253e+05x) (from 0.01599 to 3602 Mflops). #pr: updating sample at index 3 (2^th of 8), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.000121832 s (5.007e-06 s -> 5.270e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.199984 s (1.201e-02 s -> 5.330e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000339031 s and estimated a speedup of 1.000000 x (5.270e-08 s -> 5.270e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.13597 s and estimated a speedup of 1.000000 x (5.330e-08 s -> 5.330e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.000020 0.000017 0.000037 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.000037 -%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.000020 -%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.000017 +%:CONSTRUCTOR_TIMES:A.mtx S N 1 3 3 6 0.000000 0.041163 0.039981 0.081144 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.081144 +%:RSB_SUBDIVISION_TIME:A.mtx S N 1 3 3 6 0.041163 +%:RSB_SHUFFLE_TIME:A.mtx S N 1 3 3 6 0.039981 %:ROW_MAJOR_SORT_TIME:A.mtx S N 1 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 1 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.000037 +%:SORTEDCOO2RSB_TIME:A.mtx S N 1 3 3 6 0.081144 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 1 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 1 3 3 6 1.00 @@ -3480,47 +3516,47 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 1 3 3 6 6 6 6 # # Using 4 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x56a7e700]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.129s): (3 x 3)[0x5774a740]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.1 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (4 th.) took 4.101e-05s; avg 1.367e-05s ( +/- 19.77/ 9.88 %); best 1.097e-05s; worst 1.502e-05s; std dev. 1.911e-06 (taking best). -Reference operation time is 1.09673e-05 s (17.51 Mflops) with 4 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 1.097e-05 Mflops: 17.507) -Merge (3 -> 1 leaves) took w.c.t. of 7.868e-06s, ~3.099e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) -3 iterations (4 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 94.47/100.00 %); best 5.27e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 5.27024e-08 s (3643 Mflops) with 4 threads. -After merge step 1: tpop: 5.27e-08 s ~Mflops: 3643.096 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 208.098x: 1.097e-05s -> 5.27e-08s, so taking this instance. +3 iterations (4 th.) took 0.06s; avg 0.02s ( +/- 39.86/ 19.94 %); best 0.01203s; worst 0.02399s; std dev. 0.005637 (taking best). +Reference operation time is 0.012027 s (0.01596 Mflops) with 4 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.01203 Mflops: 0.016) +Merge (3 -> 1 leaves) took w.c.t. of 1.693e-05s, ~5.007e-06s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) +3 iterations (4 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 96.05/111.76 %); best 5.33e-08s; worst 2.861e-06s; std dev. 1.173e-06 (taking best). +Reference operation time is 5.32985e-08 s (3602 Mflops) with 4 threads. +After merge step 1: tpop: 5.33e-08 s ~Mflops: 3602.355 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 225654.216x: 0.01203s -> 5.33e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 6.008e-05s (of which 1.001e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 6.008e-05s, equivalent to 1140.0/5.5 new/old ops (5.531e-05s for 2 clones -- as 1049.5/5.0 ops, or 524.8/2.5 ops per clone), SPEEDUP of 208.098x -Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 208.098x (1.097e-05s -> 5.27e-08s), will amortize in 5.5 ops by saving 1.091e-05s per op. -In 1 tuning rounds (tot. 0.00014s, 5.5e-05s for constructor, 2 clones) obtained a SPEEDUP of 20709.8% (208.1x) (from 17.51 to 3643 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.04803s (of which 1.907e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 1.907e-06s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.04803s, equivalent to 901113.8/4.0 new/old ops (0.108s for 2 clones -- as 2026472.8/9.0 ops, or 1013236.4/4.5 ops per clone), SPEEDUP of 225654.216x +Applying multi-merge (3 -> 1 leaves, 1 steps, 1 -> 1 th.sp.) yielded SPEEDUP of 225654.216x (0.01203s -> 5.33e-08s), will amortize in 4.0 ops by saving 0.01203s per op. +In 1 tuning rounds (tot. 0.17s, 0.11s for constructor, 2 clones) obtained a SPEEDUP of 22565321.6% (2.257e+05x) (from 0.01596 to 3602 Mflops). #pr: updating sample at index 7 (3^th of 8), 0^th touch for (0,1,0,0,1,0,0). -First run of RSB Autotuner took 0.000146866 s (1.097e-05 s -> 5.270e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.168095 s (1.203e-02 s -> 5.330e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000414848 s and estimated a speedup of 1.000000 x (5.270e-08 s -> 5.270e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 0.907963 s and estimated a speedup of 1.000000 x (5.330e-08 s -> 5.330e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.000110 0.000190 0.000300 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.000300 -%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.000110 -%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.000190 +%:CONSTRUCTOR_TIMES:A.mtx S N 4 3 3 6 0.000000 0.037205 0.047868 0.085073 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.085073 +%:RSB_SUBDIVISION_TIME:A.mtx S N 4 3 3 6 0.037205 +%:RSB_SHUFFLE_TIME:A.mtx S N 4 3 3 6 0.047868 %:ROW_MAJOR_SORT_TIME:A.mtx S N 4 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 4 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.000300 +%:SORTEDCOO2RSB_TIME:A.mtx S N 4 3 3 6 0.085073 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 4 3 3 6 0.000 -%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.12 -%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.12 -%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 0.18 -%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.09 -%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 -nan 0.18 0.09 0.12 +%:UNSORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.95 +%:SORTEDCOO2RSB_SCALING:A.mtx S N 4 3 3 6 0.95 +%:RSB_SUBDIVISION_SCALING:A.mtx S N 4 3 3 6 1.11 +%:RSB_SHUFFLE_SCALING:A.mtx S N 4 3 3 6 0.84 +%:CONSTRUCTOR_SCALING:A.mtx S N 4 3 3 6 -nan 1.11 0.84 0.95 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 4 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 4 3 3 6 28 48 36 @@ -3529,184 +3565,184 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 4 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[4] -%operation:A.mtx 5.6982e-05 1e+09 1e+09 +%operation:A.mtx 0.129158 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:A.mtx 0 2.00272e-05 0 1.69277e-05 +%constructor:A.mtx 0 0.041163 0 0.0399811 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 8.721s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.003s/0.000s . +# so far, program took 18.077s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 5.272s/0.000s . getrusage() stats: -ru_maxrss: 73 (maximum resident set size -- MB) -ru_stime : 0.5055s (system CPU time used) -ru_utime : 9.795s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.2987s (system CPU time used) +ru_utime : 20.62s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1821.55 5.960e-06 0.000e+00 5.270e-08 0.000e+00 1.888e-04 5.09e+00 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1821.55 6.914e-06 0.000e+00 5.270e-08 0.000e+00 1.352e-04 5.09e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1801.18 2.399e-02 0.000e+00 5.330e-08 0.000e+00 1.960e-01 5.03e+00 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1801.18 1.202e-02 0.000e+00 5.330e-08 0.000e+00 2.320e-01 5.03e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 12114.4 % faster, avg. sp. ratio 122.144x, max sp. ratio 131.192x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3074.0/2565.0/3582.9/6147.9 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 25.6/ 19.6/ 31.7/ 51.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 25.8, min. 19.7, max. 32.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 33778696.7 % faster, avg. sp. ratio 337787.967x, max sp. ratio 450127.488x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4015021.2/3677347.3/4352695.1/8030042.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.7/ 8.2/ 19.3/ 27.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.7, min. 8.2, max. 19.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.174/ 4.174/ 4.174,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.170/ 5.085/ 5.085,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.128/ 4.128/ 4.128,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.057/ 5.028/ 5.028,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.822e+03, min 1.822e+03, max 1.822e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.500e+01, min 1.388e+01, max 1.611e+01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 5.270e-08s, min 5.270e-08s, max 5.270e-08s, tot 1.054e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.437e-06s, min 5.960e-06s, max 6.914e-06s, tot 1.287e-05s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 6.466e+00 6.466e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.759e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.21 s, min 0.20 s, max 0.23 s, tot 0.43 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.21 s, min 0.20 s, max 0.23 s, tot 0.43 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.801e+03, min 1.801e+03, max 1.801e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 5.995e-03, min 4.001e-03, max 7.989e-03 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.330e-08s, min 5.330e-08s, max 5.330e-08s, tot 1.066e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.800e-02s, min 1.202e-02s, max 2.399e-02s, tot 3.601e-02s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.557e+00 2.557e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.703e+00 #pr: ======== Limiting to nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 3643.10 5.007e-06 0.000e+00 5.270e-08 0.000e+00 1.218e-04 7.82e+00 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 3643.10 1.097e-05 0.000e+00 5.270e-08 0.000e+00 1.469e-04 7.82e+00 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 3602.35 1.201e-02 0.000e+00 5.330e-08 0.000e+00 2.000e-01 7.73e+00 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 3602.35 1.203e-02 0.000e+00 5.330e-08 0.000e+00 1.681e-01 7.73e+00 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 15054.9 % faster, avg. sp. ratio 151.549x, max sp. ratio 208.098x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2549.2/2311.7/2786.7/5098.4 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 18.9/ 13.4/ 24.3/ 37.7 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 19.0, min. 13.5, max. 24.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 22549441.5 % faster, avg. sp. ratio 225495.415x, max sp. ratio 225654.216x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3452999.3/3153844.8/3752153.9/6905998.7 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.3/ 14.0/ 16.7/ 30.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.3, min. 14.0, max. 16.7 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.996/ 5.996/ 5.996,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 15.635/ 7.817/ 7.817,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.929/ 5.929/ 5.929,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 15.460/ 7.730/ 7.730,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.643e+03, min 3.643e+03, max 3.643e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.793e+01, min 1.751e+01, max 3.835e+01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 5.270e-08s, min 5.270e-08s, max 5.270e-08s, tot 1.054e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.987e-06s, min 5.007e-06s, max 1.097e-05s, tot 1.597e-05s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.502e+00 4.502e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.759e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.18 s, min 0.17 s, max 0.20 s, tot 0.37 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.18 s, min 0.17 s, max 0.20 s, tot 0.37 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.602e+03, min 3.602e+03, max 3.602e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.598e-02, min 1.596e-02, max 1.599e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.330e-08s, min 5.330e-08s, max 5.330e-08s, tot 1.066e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.202e-02s, min 1.201e-02s, max 1.203e-02s, tot 2.404e-02s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.780e+00 1.780e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.703e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1821.55 5.960e-06 0.000e+00 5.270e-08 0.000e+00 1.888e-04 5.09e+00 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 3643.10 5.007e-06 0.000e+00 5.270e-08 0.000e+00 1.218e-04 7.82e+00 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1821.55 6.914e-06 0.000e+00 5.270e-08 0.000e+00 1.352e-04 5.09e+00 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 3643.10 1.097e-05 0.000e+00 5.270e-08 0.000e+00 1.469e-04 7.82e+00 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1801.18 2.399e-02 0.000e+00 5.330e-08 0.000e+00 1.960e-01 5.03e+00 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 3602.35 1.201e-02 0.000e+00 5.330e-08 0.000e+00 2.000e-01 7.73e+00 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1801.18 1.202e-02 0.000e+00 5.330e-08 0.000e+00 2.320e-01 5.03e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 3602.35 1.203e-02 0.000e+00 5.330e-08 0.000e+00 1.681e-01 7.73e+00 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 13584.7 % faster, avg. sp. ratio 136.847x, max sp. ratio 208.098x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2811.6/2311.7/3582.9/11246.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 22.2/ 13.4/ 31.7/ 89.0 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 22.4, min. 13.5, max. 32.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 28164069.1 % faster, avg. sp. ratio 281641.691x, max sp. ratio 450127.488x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3734010.3/3153844.8/4352695.1/14936041.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.5/ 8.2/ 19.3/ 58.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.5, min. 8.2, max. 19.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.085/ 4.174/ 5.996,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 25.805/ 5.085/ 7.817,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.028/ 4.128/ 5.929,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 25.517/ 5.028/ 7.730,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.732e+03, min 1.822e+03, max 3.643e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.146e+01, min 1.388e+01, max 3.835e+01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 5.270e-08s, min 5.270e-08s, max 5.270e-08s, tot 2.108e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.212e-06s, min 5.007e-06s, max 1.097e-05s, tot 2.885e-05s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.502e+00 6.466e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.759e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.20 s, min 0.17 s, max 0.23 s, tot 0.80 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.20 s, min 0.17 s, max 0.23 s, tot 0.80 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.702e+03, min 1.801e+03, max 3.602e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.099e-02, min 4.001e-03, max 1.599e-02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.330e-08s, min 5.330e-08s, max 5.330e-08s, tot 2.132e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.501e-02s, min 1.201e-02s, max 2.399e-02s, tot 6.004e-02s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.780e+00 2.557e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.703e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1821.55 5.960e-06 0.000e+00 5.270e-08 0.000e+00 1.888e-04 5.09e+00 2.29e+00 1 9.60e-05 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1821.55 6.914e-06 0.000e+00 5.270e-08 0.000e+00 1.352e-04 5.09e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1801.18 2.399e-02 0.000e+00 5.330e-08 0.000e+00 1.960e-01 5.03e+00 2.29e+00 1 9.60e-05 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1801.18 1.202e-02 0.000e+00 5.330e-08 0.000e+00 2.320e-01 5.03e+00 2.29e+00 1 9.60e-05 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 12114.4 % faster, avg. sp. ratio 122.144x, max sp. ratio 131.192x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3074.0/2565.0/3582.9/6147.9 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 25.6/ 19.6/ 31.7/ 51.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 25.8, min. 19.7, max. 32.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 33778696.7 % faster, avg. sp. ratio 337787.967x, max sp. ratio 450127.488x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4015021.2/3677347.3/4352695.1/8030042.5 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.7/ 8.2/ 19.3/ 27.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.7, min. 8.2, max. 19.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.174/ 4.174/ 4.174,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.170/ 5.085/ 5.085,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 4.128/ 4.128/ 4.128,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 10.057/ 5.028/ 5.028,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.292/ 2.292/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.822e+03, min 1.822e+03, max 1.822e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.500e+01, min 1.388e+01, max 1.611e+01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 5.270e-08s, min 5.270e-08s, max 5.270e-08s, tot 1.054e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 6.437e-06s, min 5.960e-06s, max 6.914e-06s, tot 1.287e-05s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 6.466e+00 6.466e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.759e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.21 s, min 0.20 s, max 0.23 s, tot 0.43 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.21 s, min 0.20 s, max 0.23 s, tot 0.43 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.801e+03, min 1.801e+03, max 1.801e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 5.995e-03, min 4.001e-03, max 7.989e-03 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.330e-08s, min 5.330e-08s, max 5.330e-08s, tot 1.066e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.800e-02s, min 1.202e-02s, max 2.399e-02s, tot 3.601e-02s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.557e+00 2.557e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.703e+00 #pr: ======== Limiting to both transA=N and nrhs=2: #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 3643.10 5.007e-06 0.000e+00 5.270e-08 0.000e+00 1.218e-04 7.82e+00 1.65e+00 1 1.92e-04 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 3643.10 1.097e-05 0.000e+00 5.270e-08 0.000e+00 1.469e-04 7.82e+00 1.65e+00 1 1.92e-04 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 3602.35 1.201e-02 0.000e+00 5.330e-08 0.000e+00 2.000e-01 7.73e+00 1.65e+00 1 1.92e-04 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 3602.35 1.203e-02 0.000e+00 5.330e-08 0.000e+00 1.681e-01 7.73e+00 1.65e+00 1 1.92e-04 #pr: 2 samples (out of 4) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 15054.9 % faster, avg. sp. ratio 151.549x, max sp. ratio 208.098x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2549.2/2311.7/2786.7/5098.4 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 18.9/ 13.4/ 24.3/ 37.7 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 19.0, min. 13.5, max. 24.6 ops) +#pr: (in succ. cases rsb autotuning gave avg. 22549441.5 % faster, avg. sp. ratio 225495.415x, max sp. ratio 225654.216x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3452999.3/3153844.8/3752153.9/6905998.7 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.3/ 14.0/ 16.7/ 30.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.3, min. 14.0, max. 16.7 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.996/ 5.996/ 5.996,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 15.635/ 7.817/ 7.817,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.929/ 5.929/ 5.929,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 15.460/ 7.730/ 7.730,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.646/ 1.646/ 1.646) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 1 /1 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 3.643e+03, min 3.643e+03, max 3.643e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.793e+01, min 1.751e+01, max 3.835e+01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 5.270e-08s, min 5.270e-08s, max 5.270e-08s, tot 1.054e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.987e-06s, min 5.007e-06s, max 1.097e-05s, tot 1.597e-05s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.502e+00 4.502e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.759e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.18 s, min 0.17 s, max 0.20 s, tot 0.37 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.18 s, min 0.17 s, max 0.20 s, tot 0.37 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 3.602e+03, min 3.602e+03, max 3.602e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.598e-02, min 1.596e-02, max 1.599e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.330e-08s, min 5.330e-08s, max 5.330e-08s, tot 1.066e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.202e-02s, min 1.201e-02s, max 1.203e-02s, tot 2.404e-02s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.780e+00 1.780e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.703e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 4) matched the dump criteria -- skipping dump round. @@ -3717,44 +3753,44 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 8) ordered by (1,2,1,1,2,1,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1821.55 5.960e-06 0.000e+00 5.270e-08 0.000e+00 1.888e-04 5.09e+00 2.29e+00 1 9.60e-05 -pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 3643.10 5.007e-06 0.000e+00 5.270e-08 0.000e+00 1.218e-04 7.82e+00 1.65e+00 1 1.92e-04 -pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1821.55 6.914e-06 0.000e+00 5.270e-08 0.000e+00 1.352e-04 5.09e+00 2.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 3643.10 1.097e-05 0.000e+00 5.270e-08 0.000e+00 1.469e-04 7.82e+00 1.65e+00 1 1.92e-04 +pr: 1:R_R A 3 3 6 1 Z S N 1 1 0 4.0000 4.6667 3 1 1801.18 2.399e-02 0.000e+00 5.330e-08 0.000e+00 1.960e-01 5.03e+00 2.29e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 2 Z S N 1 1 0 4.0000 4.6667 3 1 3602.35 1.201e-02 0.000e+00 5.330e-08 0.000e+00 2.000e-01 7.73e+00 1.65e+00 1 1.92e-04 +pr: 5:R_R A 3 3 6 1 Z S N 4 1 0 4.0000 4.6667 3 1 1801.18 1.202e-02 0.000e+00 5.330e-08 0.000e+00 2.320e-01 5.03e+00 2.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 2 Z S N 4 1 0 4.0000 4.6667 3 1 3602.35 1.203e-02 0.000e+00 5.330e-08 0.000e+00 1.681e-01 7.73e+00 1.65e+00 1 1.92e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 13584.7 % faster, avg. sp. ratio 136.847x, max sp. ratio 208.098x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2811.6/2311.7/3582.9/11246.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 22.2/ 13.4/ 31.7/ 89.0 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 22.4, min. 13.5, max. 32.0 ops) +#pr: (in succ. cases rsb autotuning gave avg. 28164069.1 % faster, avg. sp. ratio 281641.691x, max sp. ratio 450127.488x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3734010.3/3153844.8/4352695.1/14936041.2 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.5/ 8.2/ 19.3/ 58.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.5, min. 8.2, max. 19.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.085/ 4.174/ 5.996,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 25.805/ 5.085/ 7.817,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.028/ 4.128/ 5.929,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 25.517/ 5.028/ 7.730,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.969/ 1.646/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 2 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.732e+03, min 1.822e+03, max 3.643e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.146e+01, min 1.388e+01, max 3.835e+01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 5.270e-08s, min 5.270e-08s, max 5.270e-08s, tot 2.108e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.212e-06s, min 5.007e-06s, max 1.097e-05s, tot 2.885e-05s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 4.502e+00 6.466e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.759e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.20 s, min 0.17 s, max 0.23 s, tot 0.80 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.20 s, min 0.17 s, max 0.23 s, tot 0.80 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.702e+03, min 1.801e+03, max 3.602e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.099e-02, min 4.001e-03, max 1.599e-02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.330e-08s, min 5.330e-08s, max 5.330e-08s, tot 2.132e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.501e-02s, min 1.201e-02s, max 2.399e-02s, tot 6.004e-02s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.780e+00 2.557e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.703e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 2.000e+00 x, min 2.000e+00 x, max 2.000e+00 x (2 samples, the non-min-nrhs ones) -#pr: Record collection took 0.33 s. +#pr: Record collection took 5.80 s. #pr: Record comprises 50 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 100 environment variables in 4759 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 100 environment variables in 4813 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1767573701_gcc-14.2-1,4th.rpr -# Removing the temporary record file rsbench_pr__1767573701_gcc-14.2-1,4th.rpr.tmp. -# terminating run at 1767573710 (after 8.7s of w.c.t.) +#pr: ======== Saved a performance record of 8 samples to rsbench_pr__1733165242_gcc-14.2-1,4th.rpr +# Removing the temporary record file rsbench_pr__1733165242_gcc-14.2-1,4th.rpr.tmp. +# terminating run at 1733165260 (after 18.1s of w.c.t.) + ./rsbench -oa -Ob --help /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench is a swiss army knife for testing the library functionality and performance. You can use it to perform sparse matrix - unitary vector multiplication, specifying the blocking parameters, the times to perform multiplication. @@ -4026,10 +4062,10 @@ L2 size: 524288 L3 size: 16777216 sysconf() : 4096 bytes per pagesize -sysconf() : 4095708 physical pages -sysconf() : 3891118080 bytes (3710 MB) of physical memory -sysconf() : 1391361 available (free) physical pages -sysconf() : 1404047360 available (free) physical memory +sysconf() : 4093893 physical pages +sysconf() : 3883683840 bytes (3703 MB) of physical memory +sysconf() : 568978 available (free) physical pages +sysconf() : 2330533888 available (free) physical memory sysconf() , processors : 8 sysconf() , processors online : 8 sysconf() : level 1 cache size 32768 @@ -4060,35 +4096,35 @@ RSB_SUBM_IDX_MARKER : 2147483647 RSB_MAX_ALLOCATABLE_MEMORY_CHUNK: 4294967295 timing min delta (if negative, don't complain with us) : 0 s -timing granularity : 5.22494e-08 s +timing granularity : 5.32508e-08 s CFLAGS : -g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 CXXFLAGS : -g -O2 -fstack-protector-strong -Wformat -Werror=format-security -fopenmp CC : gcc memhinfo : L3:16/64/16M,L2:8/64/512K,L1:8/64/32K -detected free memory : 1404047360 -detected total memory : -403849216 -for array sized 16777216 elems, took 0.005759 s for linear search and 0 s for binary search for element 16777215, in 17 tries, for a total of 0.101067 s (ignore this:570425310) -for array sized 16777216 elems, took 0.00286388 s for linear search and 0 s for binary search for element 8388607, in 35 tries, for a total of 0.100834 s (ignore this:1157627800) -for array sized 16777216 elems, took 0.00142312 s for linear search and 0 s for binary search for element 4194303, in 70 tries, for a total of 0.101083 s (ignore this:1744830220) -for array sized 16777216 elems, took 0.000706196 s for linear search and 0 s for binary search for element 2097151, in 140 tries, for a total of 0.100691 s (ignore this:-1962934796) -for array sized 16777216 elems, took 0.000352859 s for linear search and 0 s for binary search for element 1048575, in 281 tries, for a total of 0.100328 s (ignore this:-1373635646) -for array sized 16777216 elems, took 0.000175953 s for linear search and 0 s for binary search for element 524287, in 560 tries, for a total of 0.100086 s (ignore this:-786434206) -for array sized 16777216 elems, took 8.67844e-05 s for linear search and 0 s for binary search for element 262143, in 1119 tries, for a total of 0.100056 s (ignore this:-199758172) -for array sized 16777216 elems, took 4.29153e-05 s for linear search and 0 s for binary search for element 131071, in 2152 tries, for a total of 0.100003 s (ignore this:364371412) -for array sized 16777216 elems, took 3.38554e-05 s for linear search and 0 s for binary search for element 65535, in 2421 tries, for a total of 0.100023 s (ignore this:681691882) -for array sized 16777216 elems, took 1.00136e-05 s for linear search and 0 s for binary search for element 32767, in 8735 tries, for a total of 0.100007 s (ignore this:1254131372) -for array sized 16777216 elems, took 4.76837e-06 s for linear search and 0 s for binary search for element 16383, in 17624 tries, for a total of 0.100001 s (ignore this:1831599356) -for array sized 16777216 elems, took 1.90735e-06 s for linear search and 0 s for binary search for element 8191, in 34298 tries, for a total of 0.100001 s (ignore this:-1901498104) -for array sized 16777216 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 4095, in 65278 tries, for a total of 0.100002 s (ignore this:-1366871284) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 2047, in 118090 tries, for a total of 0.100001 s (ignore this:-883410824) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 1023, in 200319 tries, for a total of 0.100000 s (ignore this:-473558150) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 511, in 307573 tries, for a total of 0.100001 s (ignore this:-159218544) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 255, in 437661 tries, for a total of 0.100001 s (ignore this:63988566) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 127, in 550640 tries, for a total of 0.100000 s (ignore this:203851126) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 63, in 613381 tries, for a total of 0.100000 s (ignore this:281137132) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 31, in 671182 tries, for a total of 0.100001 s (ignore this:322750416) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 15, in 682558 tries, for a total of 0.100001 s (ignore this:343227156) -for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 7, in 688429 tries, for a total of 0.100000 s (ignore this:352865162) +detected free memory : -1964433408 +detected total memory : -411283456 +for array sized 16777216 elems, took 0.00628209 s for linear search and 9.53674e-07 s for binary search for element 16777215, in 10 tries, for a total of 0.192447 s (ignore this:335544300) +for array sized 16777216 elems, took 0.00310206 s for linear search and 0 s for binary search for element 8388607, in 10 tries, for a total of 0.105713 s (ignore this:503316440) +for array sized 16777216 elems, took 0.00147295 s for linear search and 0 s for binary search for element 4194303, in 21 tries, for a total of 0.100484 s (ignore this:679477166) +for array sized 16777216 elems, took 0.000699043 s for linear search and 0 s for binary search for element 2097151, in 46 tries, for a total of 0.106143 s (ignore this:872415058) +for array sized 16777216 elems, took 0.000347137 s for linear search and 0 s for binary search for element 1048575, in 96 tries, for a total of 0.103364 s (ignore this:1073741458) +for array sized 16777216 elems, took 0.0001719 s for linear search and 0 s for binary search for element 524287, in 196 tries, for a total of 0.107903 s (ignore this:1279261962) +for array sized 16777216 elems, took 8.58307e-05 s for linear search and 0 s for binary search for element 262143, in 385 tries, for a total of 0.107878 s (ignore this:1481112072) +for array sized 16777216 elems, took 4.19617e-05 s for linear search and 0 s for binary search for element 131071, in 808 tries, for a total of 0.107875 s (ignore this:1692922808) +for array sized 16777216 elems, took 2.09808e-05 s for linear search and 0 s for binary search for element 65535, in 2291 tries, for a total of 0.100001 s (ignore this:1993204178) +for array sized 16777216 elems, took 9.77516e-06 s for linear search and 0 s for binary search for element 32767, in 3664 tries, for a total of 0.100020 s (ignore this:-2061646542) +for array sized 16777216 elems, took 4.76837e-06 s for linear search and 0 s for binary search for element 16383, in 17653 tries, for a total of 0.100001 s (ignore this:-1483228344) +for array sized 16777216 elems, took 1.90735e-06 s for linear search and 0 s for binary search for element 8191, in 32811 tries, for a total of 0.100000 s (ignore this:-945718542) +for array sized 16777216 elems, took 9.53674e-07 s for linear search and 0 s for binary search for element 4095, in 48732 tries, for a total of 0.100001 s (ignore this:-546603462) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 2047, in 109723 tries, for a total of 0.103959 s (ignore this:-97397500) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 1023, in 64381 tries, for a total of 0.106830 s (ignore this:34326026) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 511, in 167796 tries, for a total of 0.100000 s (ignore this:205813538) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 255, in 167005 tries, for a total of 0.104570 s (ignore this:290986088) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 127, in 173885 tries, for a total of 0.100001 s (ignore this:335152878) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 63, in 270595 tries, for a total of 0.100001 s (ignore this:369247848) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 31, in 298124 tries, for a total of 0.100001 s (ignore this:387731536) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 15, in 358929 tries, for a total of 0.101977 s (ignore this:398499406) +for array sized 16777216 elems, took 0 s for linear search and 0 s for binary search for element 7, in 332374 tries, for a total of 0.100001 s (ignore this:403152642) + ./rsbench -C /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench version: 1.3.0 format switches:br @@ -4135,17 +4171,17 @@ Adding matrix file: /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx # Sorting matrices list (use --no-sort-filenames-list to prevent this) # Using matrices: A.mtx -# beginning run at 1767573713 +# beginning run at 1733165264 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench -f /build/reproducible-path/librsb-1.3.0.2+dfsg/A.mtx --verbose --nrhs 1,4 --by-rows # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 # User did not specify threads; assuming 1. Environment provides max 8 threads; this build supports max 128. # User did not specify threads; assuming 1. Environment provides max 8 threads; this build supports max 128. -# average timer granularity: 5.24e-08 s -# Will write a final performance record to file rsbench_pr__1767573713_gcc-14.2.rpr and periodic checkpoints to rsbench_pr__1767573713_gcc-14.2.rpr.tmp +# average timer granularity: 5.33e-08 s +# Will write a final performance record to file rsbench_pr__1733165264_gcc-14.2.rpr and periodic checkpoints to rsbench_pr__1733165264_gcc-14.2.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs:/usr/lib/libeatmydata # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -4184,61 +4220,61 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: infom08-i386 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 1 (each --verbose occurrence counts +1) # This test will measure times in scanning arrays sized and aligned to fit in caches. # 3 cache levels detected Will fill struct with 50 samples... -# Memory benchmark took 8.840s +# Memory benchmark took 12.028s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 16 samples (4032 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 16777216 bytes, per-thread 2097152 bytes -# so far, program took 8.842s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 12.030s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # reading A.mtx (184 bytes / 1 MiB / 6 nnz / 3 rows / 3 columns / 1 MiB COO) as type D... -# file input of A.mtx took 0.00 s (6 nnz, 66576 nnz/s ) (2.04 MB/s ) -#pre-sorting (6 elements) took 0.000377893 s -#weeding duplicates (to 6 elements) took 2.14577e-06 s (and check, 9.53674e-07 s ) +# file input of A.mtx took 0.00 s (6 nnz, 73156 nnz/s ) (2.24 MB/s ) +#pre-sorting (6 elements) took 0.0433512 s +#weeding duplicates (to 6 elements) took 3.09944e-06 s (and check, 1.90735e-06 s ) # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 8 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x582017d0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.156s): (3 x 3)[0x576ba810]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (8 th.) took 4.888e-05s; avg 1.629e-05s ( +/- 38.54/ 65.37 %); best 1.001e-05s; worst 2.694e-05s; std dev. 7.57e-06 (taking best). -Reference operation time is 1.00136e-05 s (2.397 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 1.001e-05 Mflops: 2.397) -Merge (3 -> 1 leaves) took w.c.t. of 1.121e-05s, ~4.053e-06s of computing time (of which 1.192e-06s sorting, 1.192e-06s analysis) -3 iterations (8 th.) took 1.407e-05s; avg 4.689e-06s ( +/- 98.82/174.58 %); best 5.519e-08s; worst 1.287e-05s; std dev. 5.809e-06 (taking best). -Reference operation time is 5.51939e-08 s (434.8 Mflops) with 8 threads. -After merge step 1: tpop: 5.519e-08 s ~Mflops: 434.831 nsubm:1 otn:8 -Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 181.425x: 1.001e-05s -> 5.519e-08s, so taking this instance. +3 iterations (8 th.) took 0.05999s; avg 0.02s ( +/- 40.01/ 60.02 %); best 0.01199s; worst 0.032s; std dev. 0.008642 (taking best). +Reference operation time is 0.0119948 s (0.002001 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.01199 Mflops: 0.002) +Merge (3 -> 1 leaves) took w.c.t. of 3.791e-05s, ~9.06e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) +3 iterations (8 th.) took 1.502e-05s; avg 5.007e-06s ( +/- 98.88/200.00 %); best 5.594e-08s; worst 1.502e-05s; std dev. 7.081e-06 (taking best). +Reference operation time is 5.59449e-08 s (429 Mflops) with 8 threads. +After merge step 1: tpop: 5.594e-08 s ~Mflops: 428.993 nsubm:1 otn:8 +Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 214404.432x: 0.01199s -> 5.594e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 5.007e-05s (of which 1.407e-05s partitioning, 0s I/O); computing times: 4.053e-06s in par. loops, 1.192e-06s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 5.007e-05s, equivalent to 907.1/5.0 new/old ops (3.076e-05s for 2 clones -- as 557.2/3.1 ops, or 278.6/1.5 ops per clone), SPEEDUP of 181.425x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 181.425x (1.001e-05s -> 5.519e-08s), will amortize in 5.0 ops by saving 9.958e-06s per op. -In 1 tuning rounds (tot. 0.00014s, 3.1e-05s for constructor, 2 clones) obtained a SPEEDUP of 18042.5% (181.4x) (from 2.397 to 434.8 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.12s (of which 4.196e-05s partitioning, 0s I/O); computing times: 9.06e-06s in par. loops, 9.537e-07s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.12s, equivalent to 2144321.3/10.0 new/old ops (0.2038s for 2 clones -- as 3642757.3/17.0 ops, or 1821378.6/8.5 ops per clone), SPEEDUP of 214404.432x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 214404.432x (0.01199s -> 5.594e-08s), will amortize in 10.0 ops by saving 0.01199s per op. +In 1 tuning rounds (tot. 0.26s, 0.2s for constructor, 2 clones) obtained a SPEEDUP of 21440343.2% (2.144e+05x) (from 0.002001 to 429 Mflops). #pr: updating sample at index 1 (0^th of 16), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.000158787 s (1.001e-05 s -> 5.519e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.263957 s (1.199e-02 s -> 5.594e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000332117 s and estimated a speedup of 1.000000 x (5.519e-08 s -> 5.519e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.58397 s and estimated a speedup of 1.000000 x (5.594e-08 s -> 5.594e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.000022 0.000014 0.000036 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000036 -%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.000022 -%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.000014 +%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.063758 0.048096 0.111854 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.111854 +%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.063758 +%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.048096 %:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000036 +%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.111854 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 8 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 @@ -4253,50 +4289,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 8 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[8] SPMV[8] SPMV[8] -%operation:A.mtx 5.60284e-05 1e+09 1e+09 +%operation:A.mtx 0.155876 1e+09 1e+09 %constructor:matrix SORT[8] SCAN[8] SHUFFLE[8] INSERT[8] -%constructor:A.mtx 0 2.19345e-05 0 1.40667e-05 +%constructor:A.mtx 0 0.0637579 0 0.0480959 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 8 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x582017d0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.215s): (3 x 3)[0x576ba810]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (8 th.) took 3.195e-05s; avg 1.065e-05s ( +/- 32.84/ 20.90 %); best 7.153e-06s; worst 1.287e-05s; std dev. 2.503e-06 (taking best). -Reference operation time is 7.15256e-06 s (13.42 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 7.153e-06 Mflops: 13.422) -Merge (3 -> 1 leaves) took w.c.t. of 5.96e-06s, ~2.861e-06s of computing time (of which 0s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 94.66/107.69 %); best 5.519e-08s; worst 2.146e-06s; std dev. 8.778e-07 (taking best). -Reference operation time is 5.51939e-08 s (1739 Mflops) with 8 threads. -After merge step 1: tpop: 5.519e-08 s ~Mflops: 1739.323 nsubm:1 otn:8 -Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 129.590x: 7.153e-06s -> 5.519e-08s, so taking this instance. +3 iterations (8 th.) took 0.09197s; avg 0.03066s ( +/- 26.50/ 22.28 %); best 0.02253s; worst 0.03748s; std dev. 0.006173 (taking best). +Reference operation time is 0.022532 s (0.004261 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type D, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.02253 Mflops: 0.004) +Merge (3 -> 1 leaves) took w.c.t. of 1.693e-05s, ~5.007e-06s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 95.86/129.41 %); best 5.594e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). +Reference operation time is 5.59449e-08 s (1716 Mflops) with 8 threads. +After merge step 1: tpop: 5.594e-08 s ~Mflops: 1715.974 nsubm:1 otn:8 +Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 402753.036x: 0.02253s -> 5.594e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 3.481e-05s (of which 7.868e-06s partitioning, 0s I/O); computing times: 2.861e-06s in par. loops, 0s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 3.481e-05s, equivalent to 630.7/4.9 new/old ops (2.813e-05s for 2 clones -- as 509.7/3.9 ops, or 254.9/2.0 ops per clone), SPEEDUP of 129.590x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 129.590x (7.153e-06s -> 5.519e-08s), will amortize in 4.9 ops by saving 7.097e-06s per op. -In 1 tuning rounds (tot. 0.0001s, 2.8e-05s for constructor, 2 clones) obtained a SPEEDUP of 12859.0% (129.6x) (from 13.42 to 1739 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.06s (of which 1.907e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 1.907e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.06s, equivalent to 1072554.9/2.7 new/old ops (0.1359s for 2 clones -- as 2429997.9/6.0 ops, or 1214998.9/3.0 ops per clone), SPEEDUP of 402753.036x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 402753.036x (0.02253s -> 5.594e-08s), will amortize in 2.7 ops by saving 0.02253s per op. +In 1 tuning rounds (tot. 0.23s, 0.14s for constructor, 2 clones) obtained a SPEEDUP of 40275203.6% (4.028e+05x) (from 0.004261 to 1716 Mflops). #pr: updating sample at index 9 (1^th of 16), 0^th touch for (0,0,0,0,1,0,0). -First run of RSB Autotuner took 0.000109911 s (7.153e-06 s -> 5.519e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.228008 s (2.253e-02 s -> 5.594e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000323057 s and estimated a speedup of 1.000000 x (5.519e-08 s -> 5.519e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.41997 s and estimated a speedup of 1.000000 x (5.594e-08 s -> 5.594e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.7320508075688772 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.000025 0.000016 0.000041 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000041 -%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.000025 -%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.000016 +%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.079130 0.067995 0.147125 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.147125 +%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.079130 +%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.067995 %:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000041 +%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.147125 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 8 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 @@ -4311,59 +4347,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 8 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[8] SPMV[8] SPMV[8] -%operation:A.mtx 6.81877e-05 1e+09 1e+09 +%operation:A.mtx 0.215119 1e+09 1e+09 %constructor:matrix SORT[8] SCAN[8] SHUFFLE[8] INSERT[8] -%constructor:A.mtx 0 2.5034e-05 0 1.5974e-05 +%constructor:A.mtx 0 0.0791299 0 0.0679951 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 8.992s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.001s/0.000s . +# so far, program took 16.674s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 3.496s/0.000s . getrusage() stats: -ru_maxrss: 73 (maximum resident set size -- MB) -ru_stime : 0.3349s (system CPU time used) -ru_utime : 9.417s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.2354s (system CPU time used) +ru_utime : 14.01s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 16777216 bytes, per-thread 2097152 bytes -# so far, program took 8.992s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.001s/0.000s . +# so far, program took 16.674s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 3.496s/0.000s . # Reusing type converted (D->S) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 8 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x582017d0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.164s): (3 x 3)[0x576ba810]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (8 th.) took 5.198e-05s; avg 1.733e-05s ( +/- 65.60/107.80 %); best 5.96e-06s; worst 3.6e-05s; std dev. 1.331e-05 (taking best). -Reference operation time is 5.96046e-06 s (4.027 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 5.96e-06 Mflops: 4.027) -Merge (3 -> 1 leaves) took w.c.t. of 6.914e-06s, ~3.099e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) -3 iterations (8 th.) took 1.502e-05s; avg 5.007e-06s ( +/- 98.90/200.00 %); best 5.519e-08s; worst 1.502e-05s; std dev. 7.081e-06 (taking best). -Reference operation time is 5.51939e-08 s (434.8 Mflops) with 8 threads. -After merge step 1: tpop: 5.519e-08 s ~Mflops: 434.831 nsubm:1 otn:8 -Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 107.991x: 5.96e-06s -> 5.519e-08s, so taking this instance. +3 iterations (8 th.) took 0.068s; avg 0.02267s ( +/- 29.45/ 23.54 %); best 0.01599s; worst 0.028s; std dev. 0.004993 (taking best). +Reference operation time is 0.015991 s (0.001501 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.01599 Mflops: 0.002) +Merge (3 -> 1 leaves) took w.c.t. of 2.384e-05s, ~6.199e-06s of computing time (of which 1.907e-06s sorting, 5.96e-06s analysis) +3 iterations (8 th.) took 2.503e-05s; avg 8.345e-06s ( +/- 99.33/200.00 %); best 5.594e-08s; worst 2.503e-05s; std dev. 1.18e-05 (taking best). +Reference operation time is 5.59449e-08 s (429 Mflops) with 8 threads. +After merge step 1: tpop: 5.594e-08 s ~Mflops: 428.993 nsubm:1 otn:8 +Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 285834.221x: 0.01599s -> 5.594e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 4.601e-05s (of which 9.06e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 1.907e-06s analyzing) -Total merge + benchmarking process took 4.601e-05s, equivalent to 833.7/7.7 new/old ops (3.791e-05s for 2 clones -- as 686.8/6.4 ops, or 343.4/3.2 ops per clone), SPEEDUP of 107.991x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 107.991x (5.96e-06s -> 5.519e-08s), will amortize in 7.8 ops by saving 5.905e-06s per op. -In 1 tuning rounds (tot. 0.00021s, 3.8e-05s for constructor, 2 clones) obtained a SPEEDUP of 10699.1% (108x) (from 4.027 to 434.8 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.07732s (of which 2.694e-05s partitioning, 0s I/O); computing times: 6.199e-06s in par. loops, 1.907e-06s sorting, 5.96e-06s analyzing) +Total merge + benchmarking process took 0.07732s, equivalent to 1382109.5/4.8 new/old ops (0.1532s for 2 clones -- as 2738674.6/9.6 ops, or 1369337.3/4.8 ops per clone), SPEEDUP of 285834.221x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 285834.221x (0.01599s -> 5.594e-08s), will amortize in 4.8 ops by saving 0.01599s per op. +In 1 tuning rounds (tot. 0.22s, 0.15s for constructor, 2 clones) obtained a SPEEDUP of 28583322.1% (2.858e+05x) (from 0.001501 to 429 Mflops). #pr: updating sample at index 3 (2^th of 16), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.000219107 s (5.960e-06 s -> 5.519e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.221354 s (1.599e-02 s -> 5.594e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000291824 s and estimated a speedup of 1.000000 x (5.519e-08 s -> 5.519e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.33462 s and estimated a speedup of 1.000000 x (5.594e-08 s -> 5.594e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.000021 0.000017 0.000038 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000038 -%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.000021 -%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.000017 +%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.047608 0.057255 0.104863 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.104863 +%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.047608 +%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.057255 %:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000038 +%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.104863 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 8 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 @@ -4378,56 +4414,56 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 8 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[8] SPMV[8] SPMV[8] -%operation:A.mtx 5.48363e-05 1e+09 1e+09 +%operation:A.mtx 0.163614 1e+09 1e+09 %constructor:matrix SORT[8] SCAN[8] SHUFFLE[8] INSERT[8] -%constructor:A.mtx 0 2.09808e-05 0 1.69277e-05 +%constructor:A.mtx 0 0.0476081 0 0.057255 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 8 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x582017d0]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.203s): (3 x 3)[0x576ba810]{S} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (8 th.) took 3.409e-05s; avg 1.136e-05s ( +/- 28.67/ 48.95 %); best 8.106e-06s; worst 1.693e-05s; std dev. 3.953e-06 (taking best). -Reference operation time is 8.10623e-06 s (11.84 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 8.106e-06 Mflops: 11.843) -Merge (3 -> 1 leaves) took w.c.t. of 7.153e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) -3 iterations (8 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 95.91/129.41 %); best 5.519e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). -Reference operation time is 5.51939e-08 s (1739 Mflops) with 8 threads. -After merge step 1: tpop: 5.519e-08 s ~Mflops: 1739.323 nsubm:1 otn:8 -Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 146.868x: 8.106e-06s -> 5.519e-08s, so taking this instance. +3 iterations (8 th.) took 0.07999s; avg 0.02666s ( +/- 39.93/ 19.97 %); best 0.01602s; worst 0.03199s; std dev. 0.007529 (taking best). +Reference operation time is 0.0160151 s (0.005994 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type S, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.01602 Mflops: 0.006) +Merge (3 -> 1 leaves) took w.c.t. of 1.693e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 2.861e-06s analysis) +3 iterations (8 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 95.86/111.76 %); best 5.594e-08s; worst 2.861e-06s; std dev. 1.173e-06 (taking best). +Reference operation time is 5.59449e-08 s (1716 Mflops) with 8 threads. +After merge step 1: tpop: 5.594e-08 s ~Mflops: 1715.974 nsubm:1 otn:8 +Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 286264.649x: 0.01602s -> 5.594e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 3.409e-05s (of which 9.06e-06s partitioning, 0s I/O); computing times: 1.907e-06s in par. loops, 9.537e-07s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 3.409e-05s, equivalent to 617.7/4.2 new/old ops (2.885e-05s for 2 clones -- as 522.7/3.6 ops, or 261.3/1.8 ops per clone), SPEEDUP of 146.868x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 146.868x (8.106e-06s -> 5.519e-08s), will amortize in 4.2 ops by saving 8.051e-06s per op. -In 1 tuning rounds (tot. 0.0003s, 2.9e-05s for constructor, 2 clones) obtained a SPEEDUP of 14586.8% (146.9x) (from 11.84 to 1739 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.08s (of which 1.884e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 9.537e-07s sorting, 2.861e-06s analyzing) +Total merge + benchmarking process took 0.08s, equivalent to 1429891.3/5.0 new/old ops (0.1599s for 2 clones -- as 2858597.9/10.0 ops, or 1429299.0/5.0 ops per clone), SPEEDUP of 286264.649x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 286264.649x (0.01602s -> 5.594e-08s), will amortize in 5.0 ops by saving 0.01601s per op. +In 1 tuning rounds (tot. 0.24s, 0.16s for constructor, 2 clones) obtained a SPEEDUP of 28626364.9% (2.863e+05x) (from 0.005994 to 1716 Mflops). #pr: updating sample at index 11 (3^th of 16), 0^th touch for (0,0,0,0,1,1,0). -First run of RSB Autotuner took 0.00031209 s (8.106e-06 s -> 5.519e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.240022 s (1.602e-02 s -> 5.594e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000303984 s and estimated a speedup of 1.000000 x (5.519e-08 s -> 5.519e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.07596 s and estimated a speedup of 1.000000 x (5.594e-08 s -> 5.594e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:3 #norm:1.73205078 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.000022 0.000016 0.000038 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000038 -%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.000022 -%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.000016 -%:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000000 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000038 +%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000001 0.090649 0.048079 0.138728 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.138729 +%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.090649 +%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.048079 +%:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000001 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 1.000 +%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.138728 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 8 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:RSB_SUBDIVISION_SCALING:A.mtx S N 8 3 3 6 1.00 %:RSB_SHUFFLE_SCALING:A.mtx S N 8 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 8 3 3 6 -nan 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:A.mtx S N 8 3 3 6 1.00 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 8 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 8 3 3 6 28 48 36 @@ -4436,59 +4472,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 8 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[8] SPMV[8] SPMV[8] -%operation:A.mtx 5.6982e-05 1e+09 1e+09 +%operation:A.mtx 0.202652 1e+09 1e+09 %constructor:matrix SORT[8] SCAN[8] SHUFFLE[8] INSERT[8] -%constructor:A.mtx 0 2.21729e-05 0 1.5974e-05 +%constructor:A.mtx 9.53674e-07 0.0906491 0 0.048079 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 9.153s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.002s/0.000s . +# so far, program took 20.637s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 6.368s/0.000s . getrusage() stats: -ru_maxrss: 73 (maximum resident set size -- MB) -ru_stime : 0.4872s (system CPU time used) -ru_utime : 10.22s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.3714s (system CPU time used) +ru_utime : 21.52s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was S). # Cache block size total 16777216 bytes, per-thread 2097152 bytes -# so far, program took 9.153s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.002s/0.000s . +# so far, program took 20.637s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 6.368s/0.000s . # Reusing type converted (S->C) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 8 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x58204140]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.189s): (3 x 3)[0x576bd180]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (8 th.) took 6.199e-05s; avg 2.066e-05s ( +/- 56.15/ 69.62 %); best 9.06e-06s; worst 3.505e-05s; std dev. 1.079e-05 (taking best). -Reference operation time is 9.05991e-06 s (10.6 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 9.06e-06 Mflops: 10.596) -Merge (3 -> 1 leaves) took w.c.t. of 8.106e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 1.097e-05s; avg 3.656e-06s ( +/- 98.49/173.91 %); best 5.519e-08s; worst 1.001e-05s; std dev. 4.512e-06 (taking best). -Reference operation time is 5.51939e-08 s (1739 Mflops) with 8 threads. -After merge step 1: tpop: 5.519e-08 s ~Mflops: 1739.323 nsubm:1 otn:8 -Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 164.147x: 9.06e-06s -> 5.519e-08s, so taking this instance. +3 iterations (8 th.) took 0.068s; avg 0.02267s ( +/- 29.43/ 23.52 %); best 0.016s; worst 0.028s; std dev. 0.00499 (taking best). +Reference operation time is 0.0159969 s (0.006001 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.016 Mflops: 0.006) +Merge (3 -> 1 leaves) took w.c.t. of 2.003e-05s, ~7.153e-06s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 2.003e-05s; avg 6.676e-06s ( +/- 99.16/200.00 %); best 5.594e-08s; worst 2.003e-05s; std dev. 9.441e-06 (taking best). +Reference operation time is 5.59449e-08 s (1716 Mflops) with 8 threads. +After merge step 1: tpop: 5.594e-08 s ~Mflops: 1715.974 nsubm:1 otn:8 +Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 285940.763x: 0.016s -> 5.594e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 4.292e-05s (of which 9.06e-06s partitioning, 0s I/O); computing times: 1.907e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 4.292e-05s, equivalent to 777.5/4.7 new/old ops (3.219e-05s for 2 clones -- as 583.2/3.6 ops, or 291.6/1.8 ops per clone), SPEEDUP of 164.147x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 164.147x (9.06e-06s -> 5.519e-08s), will amortize in 4.8 ops by saving 9.005e-06s per op. -In 1 tuning rounds (tot. 0.00014s, 3.2e-05s for constructor, 2 clones) obtained a SPEEDUP of 16314.7% (164.1x) (from 10.6 to 1739 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.09998s (of which 2.193e-05s partitioning, 0s I/O); computing times: 7.153e-06s in par. loops, 1.907e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.09998s, equivalent to 1787078.6/6.2 new/old ops (0.1639s for 2 clones -- as 2928949.5/10.2 ops, or 1464474.7/5.1 ops per clone), SPEEDUP of 285940.763x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 285940.763x (0.016s -> 5.594e-08s), will amortize in 6.2 ops by saving 0.016s per op. +In 1 tuning rounds (tot. 0.23s, 0.16s for constructor, 2 clones) obtained a SPEEDUP of 28593976.3% (2.859e+05x) (from 0.006001 to 1716 Mflops). #pr: updating sample at index 5 (4^th of 16), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.000349998 s (9.060e-06 s -> 5.519e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.232005 s (1.600e-02 s -> 5.594e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000372887 s and estimated a speedup of 1.000000 x (5.519e-08 s -> 5.519e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.32797 s and estimated a speedup of 1.000000 x (5.594e-08 s -> 5.594e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.000020 0.000019 0.000039 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000039 -%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.000020 -%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.000019 +%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.093007 0.047997 0.141004 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.141004 +%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.093007 +%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.047997 %:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000039 +%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.141004 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 8 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 @@ -4503,50 +4539,50 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 8 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[8] SPMV[8] SPMV[8] -%operation:A.mtx 5.38826e-05 1e+09 1e+09 +%operation:A.mtx 0.189018 1e+09 1e+09 %constructor:matrix SORT[8] SCAN[8] SHUFFLE[8] INSERT[8] -%constructor:A.mtx 0 1.97887e-05 0 1.88351e-05 +%constructor:A.mtx 0 0.0930071 0 0.047997 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 8 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x58204140]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.217s): (3 x 3)[0x576bd180]{C} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (8 th.) took 7.105e-05s; avg 2.368e-05s ( +/- 57.72/ 73.15 %); best 1.001e-05s; worst 4.101e-05s; std dev. 1.291e-05 (taking best). -Reference operation time is 1.00136e-05 s (38.35 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 1.001e-05 Mflops: 38.348) -Merge (3 -> 1 leaves) took w.c.t. of 6.914e-06s, ~3.099e-06s of computing time (of which 1.192e-06s sorting, 0s analysis) -3 iterations (8 th.) took 2.861e-06s; avg 9.537e-07s ( +/- 94.21/100.00 %); best 5.519e-08s; worst 1.907e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 5.51939e-08 s (6957 Mflops) with 8 threads. -After merge step 1: tpop: 5.519e-08 s ~Mflops: 6957.290 nsubm:1 otn:8 -Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 181.425x: 1.001e-05s -> 5.519e-08s, so taking this instance. +3 iterations (8 th.) took 0.06429s; avg 0.02143s ( +/- 44.01/ 32.04 %); best 0.012s; worst 0.0283s; std dev. 0.006897 (taking best). +Reference operation time is 0.0119989 s (0.032 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type C, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.012 Mflops: 0.032) +Merge (3 -> 1 leaves) took w.c.t. of 1.812e-05s, ~5.007e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) +3 iterations (8 th.) took 3.815e-06s; avg 1.272e-06s ( +/- 95.60/125.00 %); best 5.594e-08s; worst 2.861e-06s; std dev. 1.189e-06 (taking best). +Reference operation time is 5.59449e-08 s (6864 Mflops) with 8 threads. +After merge step 1: tpop: 5.594e-08 s ~Mflops: 6863.894 nsubm:1 otn:8 +Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 214476.880x: 0.012s -> 5.594e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 3.6e-05s (of which 8.821e-06s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 1.192e-06s sorting, 0s analyzing) -Total merge + benchmarking process took 3.6e-05s, equivalent to 652.3/3.6 new/old ops (3.219e-05s for 2 clones -- as 583.2/3.2 ops, or 291.6/1.6 ops per clone), SPEEDUP of 181.425x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 181.425x (1.001e-05s -> 5.519e-08s), will amortize in 3.6 ops by saving 9.958e-06s per op. -In 1 tuning rounds (tot. 0.00014s, 3.2e-05s for constructor, 2 clones) obtained a SPEEDUP of 18042.5% (181.4x) (from 38.35 to 6957 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.07672s (of which 2.003e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 9.537e-07s sorting, 1.907e-06s analyzing) +Total merge + benchmarking process took 0.07672s, equivalent to 1371421.3/6.4 new/old ops (0.1686s for 2 clones -- as 3014353.3/14.1 ops, or 1507176.6/7.0 ops per clone), SPEEDUP of 214476.880x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 214476.880x (0.012s -> 5.594e-08s), will amortize in 6.4 ops by saving 0.012s per op. +In 1 tuning rounds (tot. 0.23s, 0.17s for constructor, 2 clones) obtained a SPEEDUP of 21447588.0% (2.145e+05x) (from 0.032 to 6864 Mflops). #pr: updating sample at index 13 (5^th of 16), 0^th touch for (0,0,0,0,1,2,0). -First run of RSB Autotuner took 0.000153065 s (1.001e-05 s -> 5.519e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.233026 s (1.200e-02 s -> 5.594e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000315905 s and estimated a speedup of 1.000000 x (5.519e-08 s -> 5.519e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.44317 s and estimated a speedup of 1.000000 x (5.594e-08 s -> 5.594e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.73205078 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.000022 0.000014 0.000036 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000036 -%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.000022 -%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.000014 +%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.068832 0.067979 0.136811 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.136811 +%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.068832 +%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.067979 %:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000036 +%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.136811 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 8 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 @@ -4561,59 +4597,59 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 8 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[8] SPMV[8] SPMV[8] -%operation:A.mtx 5.38826e-05 1e+09 1e+09 +%operation:A.mtx 0.21682 1e+09 1e+09 %constructor:matrix SORT[8] SCAN[8] SHUFFLE[8] INSERT[8] -%constructor:A.mtx 0 2.19345e-05 0 1.40667e-05 +%constructor:A.mtx 0 0.0688322 0 0.0679791 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 9.315s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.003s/0.000s . +# so far, program took 24.942s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 9.604s/0.000s . getrusage() stats: -ru_maxrss: 73 (maximum resident set size -- MB) -ru_stime : 0.6275s (system CPU time used) -ru_utime : 11.02s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.544s (system CPU time used) +ru_utime : 30.13s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was C). # Cache block size total 16777216 bytes, per-thread 2097152 bytes -# so far, program took 9.315s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.003s/0.000s . +# so far, program took 24.942s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 9.604s/0.000s . # Reusing type converted (C->Z) arrays from last iteration instead of reloading matrix file. # multi-nrhs benchmarking (1,4) -- now using nrhs 1. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 8 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x58204140]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.139s): (3 x 3)[0x576bd180]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (8 th.) took 5.317e-05s; avg 1.772e-05s ( +/- 55.61/109.87 %); best 7.868e-06s; worst 3.719e-05s; std dev. 1.377e-05 (taking best). -Reference operation time is 7.86781e-06 s (12.2 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 7.868e-06 Mflops: 12.202) -Merge (3 -> 1 leaves) took w.c.t. of 6.199e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) -3 iterations (8 th.) took 1.311e-05s; avg 4.371e-06s ( +/- 98.74/172.73 %); best 5.519e-08s; worst 1.192e-05s; std dev. 5.361e-06 (taking best). -Reference operation time is 5.51939e-08 s (1739 Mflops) with 8 threads. -After merge step 1: tpop: 5.519e-08 s ~Mflops: 1739.323 nsubm:1 otn:8 -Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 142.549x: 7.868e-06s -> 5.519e-08s, so taking this instance. +3 iterations (8 th.) took 0.09184s; avg 0.03061s ( +/- 9.04/ 17.59 %); best 0.02785s; worst 0.036s; std dev. 0.003808 (taking best). +Reference operation time is 0.0278471 s (0.003447 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.02785 Mflops: 0.003) +Merge (3 -> 1 leaves) took w.c.t. of 1.812e-05s, ~6.199e-06s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 1.407e-05s; avg 4.689e-06s ( +/- 98.81/200.00 %); best 5.594e-08s; worst 1.407e-05s; std dev. 6.631e-06 (taking best). +Reference operation time is 5.59449e-08 s (1716 Mflops) with 8 threads. +After merge step 1: tpop: 5.594e-08 s ~Mflops: 1715.974 nsubm:1 otn:8 +Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 497758.364x: 0.02785s -> 5.594e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 4.315e-05s (of which 8.106e-06s partitioning, 0s I/O); computing times: 1.907e-06s in par. loops, 9.537e-07s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 4.315e-05s, equivalent to 781.9/5.5 new/old ops (2.885e-05s for 2 clones -- as 522.7/3.7 ops, or 261.3/1.8 ops per clone), SPEEDUP of 142.549x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 142.549x (7.868e-06s -> 5.519e-08s), will amortize in 5.5 ops by saving 7.813e-06s per op. -In 1 tuning rounds (tot. 0.00013s, 2.9e-05s for constructor, 2 clones) obtained a SPEEDUP of 14154.9% (142.5x) (from 12.2 to 1739 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.08417s (of which 2.003e-05s partitioning, 0s I/O); computing times: 6.199e-06s in par. loops, 1.907e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.08417s, equivalent to 1504479.0/3.0 new/old ops (0.1601s for 2 clones -- as 2861440.4/5.7 ops, or 1430720.2/2.9 ops per clone), SPEEDUP of 497758.364x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 497758.364x (0.02785s -> 5.594e-08s), will amortize in 3.0 ops by saving 0.02785s per op. +In 1 tuning rounds (tot. 0.25s, 0.16s for constructor, 2 clones) obtained a SPEEDUP of 49775736.4% (4.978e+05x) (from 0.003447 to 1716 Mflops). #pr: updating sample at index 7 (6^th of 16), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.000138998 s (7.868e-06 s -> 5.519e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.252036 s (2.785e-02 s -> 5.594e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000335932 s and estimated a speedup of 1.000000 x (5.519e-08 s -> 5.519e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.17994 s and estimated a speedup of 1.000000 x (5.594e-08 s -> 5.594e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.000024 0.000014 0.000038 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000038 -%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.000024 -%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.000014 +%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.051344 0.048002 0.099346 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.099346 +%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.051344 +%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.048002 %:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000000 %:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000038 +%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.099346 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 8 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 @@ -4628,56 +4664,56 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 8 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[8] SPMV[8] SPMV[8] -%operation:A.mtx 6.19888e-05 1e+09 1e+09 +%operation:A.mtx 0.139345 1e+09 1e+09 %constructor:matrix SORT[8] SCAN[8] SHUFFLE[8] INSERT[8] -%constructor:A.mtx 0 2.40803e-05 0 1.40667e-05 +%constructor:A.mtx 0 0.0513439 0 0.048002 # symmetric matrix --- skipping transposed benchmarking # multi-nrhs benchmarking (1,4) -- now using nrhs 4. # Using alpha=1 beta=1 order=rows for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # multi-transpose benchmarking -- now using transA = N. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 8 threads -# Constructed matrix (took 0.000s): (3 x 3)[0x58204140]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' +# Constructed matrix (took 0.169s): (3 x 3)[0x576bd180]{Z} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2442186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'S' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:3 -3 iterations (8 th.) took 3.91e-05s; avg 1.303e-05s ( +/- 37.80/ 53.66 %); best 8.106e-06s; worst 2.003e-05s; std dev. 5.081e-06 (taking best). -Reference operation time is 8.10623e-06 s (47.37 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 8.106e-06 Mflops: 47.371) -Merge (3 -> 1 leaves) took w.c.t. of 5.96e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 3.099e-06s; avg 1.033e-06s ( +/- 94.66/107.69 %); best 5.519e-08s; worst 2.146e-06s; std dev. 8.778e-07 (taking best). -Reference operation time is 5.51939e-08 s (6957 Mflops) with 8 threads. -After merge step 1: tpop: 5.519e-08 s ~Mflops: 6957.290 nsubm:1 otn:8 -Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 146.868x: 8.106e-06s -> 5.519e-08s, so taking this instance. +3 iterations (8 th.) took 0.06002s; avg 0.02001s ( +/- 39.88/ 59.90 %); best 0.01203s; worst 0.03199s; std dev. 0.008629 (taking best). +Reference operation time is 0.0120292 s (0.03192 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=4, order=rows) (max 6 steps, inclusive 3 grace steps) on: 3 x 3, type Z, 6 nnz, 2 nnz/r, 4 subms, 3 lsubms, 4.0000 bpnz (tpop: 0.01203 Mflops: 0.032) +Merge (3 -> 1 leaves) took w.c.t. of 1.907e-05s, ~5.007e-06s of computing time (of which 1.907e-06s sorting, 3.099e-06s analysis) +3 iterations (8 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 95.86/129.41 %); best 5.594e-08s; worst 3.099e-06s; std dev. 1.296e-06 (taking best). +Reference operation time is 5.59449e-08 s (6864 Mflops) with 8 threads. +After merge step 1: tpop: 5.594e-08 s ~Mflops: 6863.894 nsubm:1 otn:8 +Applying merge (3 -> 1 leaves, 8 th.) yielded SPEEDUP of 215018.112x: 0.01203s -> 5.594e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 3.195e-05s (of which 7.868e-06s partitioning, 0s I/O); computing times: 1.907e-06s in par. loops, 9.537e-07s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 3.195e-05s, equivalent to 578.8/3.9 new/old ops (2.789e-05s for 2 clones -- as 505.4/3.4 ops, or 252.7/1.7 ops per clone), SPEEDUP of 146.868x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 146.868x (8.106e-06s -> 5.519e-08s), will amortize in 4.0 ops by saving 8.051e-06s per op. -In 1 tuning rounds (tot. 0.0001s, 2.8e-05s for constructor, 2 clones) obtained a SPEEDUP of 14586.8% (146.9x) (from 47.37 to 6957 Mflops). +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.07195s (of which 2.098e-05s partitioning, 0s I/O); computing times: 5.007e-06s in par. loops, 1.907e-06s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.07195s, equivalent to 1286175.2/6.0 new/old ops (0.1519s for 2 clones -- as 2714728.3/12.6 ops, or 1357364.2/6.3 ops per clone), SPEEDUP of 215018.112x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 215018.112x (0.01203s -> 5.594e-08s), will amortize in 6.0 ops by saving 0.01203s per op. +In 1 tuning rounds (tot. 0.21s, 0.15s for constructor, 2 clones) obtained a SPEEDUP of 21501711.2% (2.15e+05x) (from 0.03192 to 6864 Mflops). #pr: updating sample at index 15 (7^th of 16), 0^th touch for (0,0,0,0,1,3,0). -First run of RSB Autotuner took 0.00011301 s (8.106e-06 s -> 5.519e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.211994 s (1.203e-02 s -> 5.594e-08 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. -Second run of RSB Autotuner took 0.000349045 s and estimated a speedup of 1.000000 x (5.519e-08 s -> 5.519e-08 s per op) in same matrix (1 -> 1 lsubm) +Second run of RSB Autotuner took 1.14399 s and estimated a speedup of 1.000000 x (5.594e-08 s -> 5.594e-08 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:3 0 #norm:1.7320508075688772 0 #used index storage compared to COO:28 vs 48 bytes (58.33%) ; compared to CSR:28 vs 40 bytes (77.78%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000000 0.000026 0.000016 0.000042 -%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000042 -%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.000026 -%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.000016 -%:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000000 -%:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 -nan -%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.000042 +%:CONSTRUCTOR_TIMES:A.mtx S N 8 3 3 6 0.000001 0.073192 0.047995 0.121187 +%:UNSORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.121188 +%:RSB_SUBDIVISION_TIME:A.mtx S N 8 3 3 6 0.073192 +%:RSB_SHUFFLE_TIME:A.mtx S N 8 3 3 6 0.047995 +%:ROW_MAJOR_SORT_TIME:A.mtx S N 8 3 3 6 0.000001 +%:ROW_MAJOR_SORT_SCALING:A.mtx S N 8 3 3 6 1.000 +%:SORTEDCOO2RSB_TIME:A.mtx S N 8 3 3 6 0.121187 %:ROW_MAJOR_SORT_TO_MOP:A.mtx S N 8 3 3 6 0.000 %:UNSORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:SORTEDCOO2RSB_SCALING:A.mtx S N 8 3 3 6 1.00 %:RSB_SUBDIVISION_SCALING:A.mtx S N 8 3 3 6 1.00 %:RSB_SHUFFLE_SCALING:A.mtx S N 8 3 3 6 1.00 -%:CONSTRUCTOR_SCALING:A.mtx S N 8 3 3 6 -nan 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:A.mtx S N 8 3 3 6 1.00 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:A.mtx S N 8 3 3 6 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:A.mtx S N 8 3 3 6 28 48 36 @@ -4686,332 +4722,336 @@ %:SM_MINMAXAVGNNZ:A.mtx S N 8 3 3 6 6 6 6 # %operation:matrix CONSTRUCTOR[8] SPMV[8] SPMV[8] -%operation:A.mtx 5.60284e-05 1e+09 1e+09 +%operation:A.mtx 0.169198 1e+09 1e+09 %constructor:matrix SORT[8] SCAN[8] SHUFFLE[8] INSERT[8] -%constructor:A.mtx 0 2.59876e-05 0 1.62125e-05 +%constructor:A.mtx 9.53674e-07 0.0731921 0 0.0479951 # symmetric matrix --- skipping transposed benchmarking -# so far, program took 9.475s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.004s/0.000s . +# so far, program took 28.564s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 12.392s/0.000s . getrusage() stats: -ru_maxrss: 73 (maximum resident set size -- MB) -ru_stime : 0.7806s (system CPU time used) -ru_utime : 11.82s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.6658s (system CPU time used) +ru_utime : 38.29s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== Limiting to type D: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 434.83 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.588e-04 2.68e+00 5.17e+00 1 2.40e-05 -pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.153e-06 0.000e+00 5.519e-08 0.000e+00 1.099e-04 6.59e+00 2.79e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 428.99 1.199e-02 0.000e+00 5.594e-08 0.000e+00 2.640e-01 2.65e+00 5.17e+00 1 2.40e-05 +pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.253e-02 0.000e+00 5.594e-08 0.000e+00 2.280e-01 6.51e+00 2.79e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 15450.8 % faster, avg. sp. ratio 155.508x, max sp. ratio 181.425x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2434.1/1991.4/2876.9/4868.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.6/ 15.4/ 15.9/ 31.2 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 15.7, min. 15.5, max. 15.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 30857773.4 % faster, avg. sp. ratio 308578.734x, max sp. ratio 402753.036x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4396869.8/4075580.7/4718159.0/8793739.6 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 16.1/ 10.1/ 22.0/ 32.1 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 16.1, min. 10.1, max. 22.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.551/ 2.247/ 4.856,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.276/ 2.681/ 6.595,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.503/ 2.216/ 4.790,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.152/ 2.645/ 6.506,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 3.979/ 2.792/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.087e+03, min 4.348e+02, max 1.739e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.909e+00, min 2.397e+00, max 1.342e+01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 1.104e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.583e-06s, min 7.153e-06s, max 1.001e-05s, tot 1.717e-05s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 5.525e+00 1.194e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.25 s, min 0.23 s, max 0.26 s, tot 0.49 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.25 s, min 0.23 s, max 0.26 s, tot 0.49 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.072e+03, min 4.290e+02, max 1.716e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.131e-03, min 2.001e-03, max 4.261e-03 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 1.119e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.726e-02s, min 1.199e-02s, max 2.253e-02s, tot 3.453e-02s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.859e+00 4.019e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type S: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 434.83 5.960e-06 0.000e+00 5.519e-08 0.000e+00 2.191e-04 1.59e+00 3.17e+00 1 2.40e-05 -pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1739.32 8.106e-06 0.000e+00 5.519e-08 0.000e+00 3.121e-04 3.55e+00 1.54e+00 1 9.60e-05 +pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 428.99 1.599e-02 0.000e+00 5.594e-08 0.000e+00 2.214e-01 1.57e+00 3.17e+00 1 2.40e-05 +pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.602e-02 0.000e+00 5.594e-08 0.000e+00 2.400e-01 3.50e+00 1.54e+00 1 9.60e-05 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 12643.0 % faster, avg. sp. ratio 127.430x, max sp. ratio 146.868x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4812.1/3969.8/5654.4/9624.2 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 37.6/ 36.8/ 38.5/ 75.3 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 37.9, min. 37.1, max. 38.8 ops) +#pr: (in succ. cases rsb autotuning gave avg. 28604843.5 % faster, avg. sp. ratio 286049.435x, max sp. ratio 286264.649x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4123483.9/3956641.8/4290326.0/8246967.8 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.4/ 13.8/ 15.0/ 28.8 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.4, min. 13.8, max. 15.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 8/ 8/ 8) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 24/ 24/ 24) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.029/ 1.377/ 2.681,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 5.145/ 1.594/ 3.551,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.002/ 1.358/ 2.645,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 5.076/ 1.573/ 3.503,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.354/ 1.542/ 3.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.087e+03, min 4.348e+02, max 1.739e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.935e+00, min 4.027e+00, max 1.184e+01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 1.104e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.033e-06s, min 5.960e-06s, max 8.106e-06s, tot 1.407e-05s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.000e+01 1.948e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.23 s, min 0.22 s, max 0.24 s, tot 0.46 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.23 s, min 0.22 s, max 0.24 s, tot 0.46 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.072e+03, min 4.290e+02, max 1.716e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.748e-03, min 1.501e-03, max 5.994e-03 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 1.119e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.600e-02s, min 1.599e-02s, max 1.602e-02s, tot 3.201e-02s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 3.367e+00 6.557e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type C: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1739.32 9.060e-06 0.000e+00 5.519e-08 0.000e+00 3.500e-04 2.68e+00 1.29e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6957.29 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.531e-04 6.59e+00 6.98e-01 1 3.84e-04 +pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.600e-02 0.000e+00 5.594e-08 0.000e+00 2.320e-01 2.65e+00 1.29e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.200e-02 0.000e+00 5.594e-08 0.000e+00 2.330e-01 6.51e+00 6.98e-01 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 17178.6 % faster, avg. sp. ratio 172.786x, max sp. ratio 181.425x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4557.2/2773.2/6341.3/9114.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 27.0/ 15.3/ 38.6/ 53.9 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 27.1, min. 15.4, max. 38.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 25020782.2 % faster, avg. sp. ratio 250208.822x, max sp. ratio 285940.763x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4156151.7/4147027.5/4165275.9/8312303.4 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 17.0/ 14.5/ 19.4/ 33.9 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 17.0, min. 14.5, max. 19.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 16/ 16/ 16) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 48/ 48/ 48) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.551/ 2.247/ 4.856,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.276/ 2.681/ 6.595,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.503/ 2.216/ 4.790,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 9.152/ 2.645/ 6.506,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 0.995/ 0.698/ 1.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 4.348e+03, min 1.739e+03, max 6.957e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.447e+01, min 1.060e+01, max 3.835e+01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 1.104e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 9.537e-06s, min 9.060e-06s, max 1.001e-05s, tot 1.907e-05s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 5.525e+00 1.194e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.23 s, min 0.23 s, max 0.23 s, tot 0.47 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.23 s, min 0.23 s, max 0.23 s, tot 0.47 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.290e+03, min 1.716e+03, max 6.864e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.900e-02, min 6.001e-03, max 3.200e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 1.119e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.400e-02s, min 1.200e-02s, max 1.600e-02s, tot 2.800e-02s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 1.859e+00 4.019e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to type Z: #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.868e-06 0.000e+00 5.519e-08 0.000e+00 1.390e-04 4.86e+00 2.29e+00 1 9.60e-05 -pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6957.29 8.106e-06 0.000e+00 5.519e-08 0.000e+00 1.130e-04 1.27e+01 1.32e+00 1 3.84e-04 +pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.785e-02 0.000e+00 5.594e-08 0.000e+00 2.520e-01 4.79e+00 2.29e+00 1 9.60e-05 +pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.203e-02 0.000e+00 5.594e-08 0.000e+00 2.120e-01 1.25e+01 1.32e+00 1 3.84e-04 #pr: 2 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 2 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 14370.8 % faster, avg. sp. ratio 144.708x, max sp. ratio 146.868x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 2282.9/2047.5/2518.4/4565.9 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.8/ 13.9/ 17.7/ 31.6 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 15.9, min. 14.0, max. 17.8 ops) +#pr: (in succ. cases rsb autotuning gave avg. 35638723.8 % faster, avg. sp. ratio 356388.238x, max sp. ratio 497758.364x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4147204.3/3789333.0/4505075.6/8294408.7 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 13.3/ 9.1/ 17.6/ 26.7 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 13.3, min. 9.1, max. 17.6 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 32/ 32/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 96/ 96/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 6.595/ 3.986/ 9.204,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 17.538/ 4.856/ 12.683,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 6.506/ 3.932/ 9.080,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 17.303/ 4.790/ 12.512,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.807/ 1.323/ 2.292) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 2 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /2 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (2 samples) -#pr: best tun. rsb canon. mflops were: on avg. 4.348e+03, min 1.739e+03, max 6.957e+03 (2 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.979e+01, min 1.220e+01, max 4.737e+01 (2 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 1.104e-07s (2 samples) -#pr: ref. unt. rsb operation time was: on avg. 7.987e-06s, min 7.868e-06s, max 8.106e-06s, tot 1.597e-05s (2 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.915e+00 6.730e+00 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.23 s, min 0.21 s, max 0.25 s, tot 0.46 s (2 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.23 s, min 0.21 s, max 0.25 s, tot 0.46 s (2 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.290e+03, min 1.716e+03, max 6.864e+03 (2 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.768e-02, min 3.447e-03, max 3.192e-02 (2 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 1.119e-07s (2 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.994e-02s, min 1.203e-02s, max 2.785e-02s, tot 3.988e-02s (2 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.809e-01 2.265e+00 +#pr: # Warning: extrapolated memory I/O bandwidth exceeds memory bandwidth --- is this a tiny matrix ? +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (1 samples, the non-min-nrhs ones) #pr: ======== Limiting to nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 434.83 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.588e-04 2.68e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 434.83 5.960e-06 0.000e+00 5.519e-08 0.000e+00 2.191e-04 1.59e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1739.32 9.060e-06 0.000e+00 5.519e-08 0.000e+00 3.500e-04 2.68e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.868e-06 0.000e+00 5.519e-08 0.000e+00 1.390e-04 4.86e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 428.99 1.199e-02 0.000e+00 5.594e-08 0.000e+00 2.640e-01 2.65e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 428.99 1.599e-02 0.000e+00 5.594e-08 0.000e+00 2.214e-01 1.57e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.600e-02 0.000e+00 5.594e-08 0.000e+00 2.320e-01 2.65e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.785e-02 0.000e+00 5.594e-08 0.000e+00 2.520e-01 4.79e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 14802.8 % faster, avg. sp. ratio 149.028x, max sp. ratio 181.425x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3926.6/2518.4/6341.3/15706.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 27.2/ 15.9/ 38.6/108.9 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 27.4, min. 15.9, max. 38.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 32098344.5 % faster, avg. sp. ratio 320984.445x, max sp. ratio 497758.364x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4331726.0/3956641.8/4718159.0/17326903.9 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.9/ 9.1/ 22.0/ 59.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.9, min. 9.1, max. 22.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.464/ 1.377/ 3.986,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 11.813/ 1.594/ 4.856,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.431/ 1.358/ 3.932,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 11.654/ 1.573/ 4.790,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.087e+03, min 4.348e+02, max 1.739e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.305e+00, min 2.397e+00, max 1.220e+01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 2.208e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.225e-06s, min 5.960e-06s, max 1.001e-05s, tot 3.290e-05s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 6.730e+00 1.948e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.24 s, min 0.22 s, max 0.26 s, tot 0.97 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.24 s, min 0.22 s, max 0.26 s, tot 0.97 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.072e+03, min 4.290e+02, max 1.716e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.238e-03, min 1.501e-03, max 6.001e-03 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 2.238e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.796e-02s, min 1.199e-02s, max 2.785e-02s, tot 7.183e-02s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.265e+00 6.557e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: ======== Limiting to nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.153e-06 0.000e+00 5.519e-08 0.000e+00 1.099e-04 6.59e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1739.32 8.106e-06 0.000e+00 5.519e-08 0.000e+00 3.121e-04 3.55e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6957.29 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.531e-04 6.59e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6957.29 8.106e-06 0.000e+00 5.519e-08 0.000e+00 1.130e-04 1.27e+01 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.253e-02 0.000e+00 5.594e-08 0.000e+00 2.280e-01 6.51e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.602e-02 0.000e+00 5.594e-08 0.000e+00 2.400e-01 3.50e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.200e-02 0.000e+00 5.594e-08 0.000e+00 2.330e-01 6.51e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.203e-02 0.000e+00 5.594e-08 0.000e+00 2.120e-01 1.25e+01 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 15018.8 % faster, avg. sp. ratio 151.188x, max sp. ratio 181.425x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3116.6/1991.4/5654.4/12466.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 20.8/ 13.9/ 38.5/ 83.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 20.9, min. 14.0, max. 38.8 ops) +#pr: (in succ. cases rsb autotuning gave avg. 27962717.0 % faster, avg. sp. ratio 279628.170x, max sp. ratio 402753.036x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4080128.9/3789333.0/4290326.0/16320515.7 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.5/ 10.1/ 19.4/ 62.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.5, min. 10.1, max. 19.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.399/ 2.681/ 9.204,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.424/ 3.551/ 12.683,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.327/ 2.645/ 9.080,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.029/ 3.503/ 12.512,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 4.348e+03, min 1.739e+03, max 6.957e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.775e+01, min 1.184e+01, max 4.737e+01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 2.208e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.345e-06s, min 7.153e-06s, max 1.001e-05s, tot 3.338e-05s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.915e+00 1.000e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.23 s, min 0.21 s, max 0.24 s, tot 0.91 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.23 s, min 0.21 s, max 0.24 s, tot 0.91 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.290e+03, min 1.716e+03, max 6.864e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.855e-02, min 4.261e-03, max 3.200e-02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 2.238e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.564e-02s, min 1.200e-02s, max 2.253e-02s, tot 6.258e-02s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.809e-01 3.367e+00 +#pr: # Warning: extrapolated memory I/O bandwidth exceeds memory bandwidth --- is this a tiny matrix ? +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=N: #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 434.83 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.588e-04 2.68e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 434.83 5.960e-06 0.000e+00 5.519e-08 0.000e+00 2.191e-04 1.59e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1739.32 9.060e-06 0.000e+00 5.519e-08 0.000e+00 3.500e-04 2.68e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.868e-06 0.000e+00 5.519e-08 0.000e+00 1.390e-04 4.86e+00 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.153e-06 0.000e+00 5.519e-08 0.000e+00 1.099e-04 6.59e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1739.32 8.106e-06 0.000e+00 5.519e-08 0.000e+00 3.121e-04 3.55e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6957.29 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.531e-04 6.59e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6957.29 8.106e-06 0.000e+00 5.519e-08 0.000e+00 1.130e-04 1.27e+01 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 428.99 1.199e-02 0.000e+00 5.594e-08 0.000e+00 2.640e-01 2.65e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 428.99 1.599e-02 0.000e+00 5.594e-08 0.000e+00 2.214e-01 1.57e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.600e-02 0.000e+00 5.594e-08 0.000e+00 2.320e-01 2.65e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.785e-02 0.000e+00 5.594e-08 0.000e+00 2.520e-01 4.79e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.253e-02 0.000e+00 5.594e-08 0.000e+00 2.280e-01 6.51e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.602e-02 0.000e+00 5.594e-08 0.000e+00 2.400e-01 3.50e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.200e-02 0.000e+00 5.594e-08 0.000e+00 2.330e-01 6.51e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.203e-02 0.000e+00 5.594e-08 0.000e+00 2.120e-01 1.25e+01 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 14910.8 % faster, avg. sp. ratio 150.108x, max sp. ratio 181.425x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3521.6/1991.4/6341.3/28172.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 24.0/ 13.9/ 38.6/192.0 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 24.2, min. 14.0, max. 38.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 30030530.7 % faster, avg. sp. ratio 300306.307x, max sp. ratio 497758.364x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4205927.4/3789333.0/4718159.0/33647419.6 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.2/ 9.1/ 22.0/121.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.2, min. 9.1, max. 22.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.932/ 1.377/ 9.204,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 41.236/ 1.594/ 12.683,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.879/ 1.358/ 9.080,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 40.683/ 1.573/ 12.512,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /8 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (8 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.718e+03, min 4.348e+02, max 6.957e+03 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.753e+01, min 2.397e+00, max 4.737e+01 (8 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 4.416e-07s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.285e-06s, min 5.960e-06s, max 1.001e-05s, tot 6.628e-05s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.915e+00 1.948e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.24 s, min 0.21 s, max 0.26 s, tot 1.88 s (8 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.24 s, min 0.21 s, max 0.26 s, tot 1.88 s (8 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.681e+03, min 4.290e+02, max 6.864e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.089e-02, min 1.501e-03, max 3.200e-02 (8 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 4.476e-07s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.680e-02s, min 1.199e-02s, max 2.785e-02s, tot 1.344e-01s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.809e-01 6.557e+00 +#pr: # Warning: extrapolated memory I/O bandwidth exceeds memory bandwidth --- is this a tiny matrix ? +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to both transA=N and nrhs=1: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 434.83 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.588e-04 2.68e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 434.83 5.960e-06 0.000e+00 5.519e-08 0.000e+00 2.191e-04 1.59e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1739.32 9.060e-06 0.000e+00 5.519e-08 0.000e+00 3.500e-04 2.68e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.868e-06 0.000e+00 5.519e-08 0.000e+00 1.390e-04 4.86e+00 2.29e+00 1 9.60e-05 +pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 428.99 1.199e-02 0.000e+00 5.594e-08 0.000e+00 2.640e-01 2.65e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 428.99 1.599e-02 0.000e+00 5.594e-08 0.000e+00 2.214e-01 1.57e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.600e-02 0.000e+00 5.594e-08 0.000e+00 2.320e-01 2.65e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.785e-02 0.000e+00 5.594e-08 0.000e+00 2.520e-01 4.79e+00 2.29e+00 1 9.60e-05 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 14802.8 % faster, avg. sp. ratio 149.028x, max sp. ratio 181.425x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3926.6/2518.4/6341.3/15706.3 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 27.2/ 15.9/ 38.6/108.9 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 27.4, min. 15.9, max. 38.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 32098344.5 % faster, avg. sp. ratio 320984.445x, max sp. ratio 497758.364x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4331726.0/3956641.8/4718159.0/17326903.9 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 14.9/ 9.1/ 22.0/ 59.4 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 14.9, min. 9.1, max. 22.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.464/ 1.377/ 3.986,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 11.813/ 1.594/ 4.856,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 2.431/ 1.358/ 3.932,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 11.654/ 1.573/ 4.790,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.979/ 1.292/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 1.087e+03, min 4.348e+02, max 1.739e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 7.305e+00, min 2.397e+00, max 1.220e+01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 2.208e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.225e-06s, min 5.960e-06s, max 1.001e-05s, tot 3.290e-05s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 6.730e+00 1.948e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.24 s, min 0.22 s, max 0.26 s, tot 0.97 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.24 s, min 0.22 s, max 0.26 s, tot 0.97 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 1.072e+03, min 4.290e+02, max 1.716e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 3.238e-03, min 1.501e-03, max 6.001e-03 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 2.238e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.796e-02s, min 1.199e-02s, max 2.785e-02s, tot 7.183e-02s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.265e+00 6.557e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: ======== Limiting to both transA=N and nrhs=4: #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.153e-06 0.000e+00 5.519e-08 0.000e+00 1.099e-04 6.59e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1739.32 8.106e-06 0.000e+00 5.519e-08 0.000e+00 3.121e-04 3.55e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6957.29 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.531e-04 6.59e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6957.29 8.106e-06 0.000e+00 5.519e-08 0.000e+00 1.130e-04 1.27e+01 1.32e+00 1 3.84e-04 +pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.253e-02 0.000e+00 5.594e-08 0.000e+00 2.280e-01 6.51e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.602e-02 0.000e+00 5.594e-08 0.000e+00 2.400e-01 3.50e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.200e-02 0.000e+00 5.594e-08 0.000e+00 2.330e-01 6.51e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.203e-02 0.000e+00 5.594e-08 0.000e+00 2.120e-01 1.25e+01 1.32e+00 1 3.84e-04 #pr: 4 samples (out of 8) matched the dump limiting criteria. #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 15018.8 % faster, avg. sp. ratio 151.188x, max sp. ratio 181.425x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3116.6/1991.4/5654.4/12466.5 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 20.8/ 13.9/ 38.5/ 83.1 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 20.9, min. 14.0, max. 38.8 ops) +#pr: (in succ. cases rsb autotuning gave avg. 27962717.0 % faster, avg. sp. ratio 279628.170x, max sp. ratio 402753.036x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4080128.9/3789333.0/4290326.0/16320515.7 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.5/ 10.1/ 19.4/ 62.2 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.5, min. 10.1, max. 19.4 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.399/ 2.681/ 9.204,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.424/ 3.551/ 12.683,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 5.327/ 2.645/ 9.080,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 29.029/ 3.503/ 12.512,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.589/ 0.698/ 2.792) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 4.348e+03, min 1.739e+03, max 6.957e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 2.775e+01, min 1.184e+01, max 4.737e+01 (4 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 2.208e-07s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.345e-06s, min 7.153e-06s, max 1.001e-05s, tot 3.338e-05s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.915e+00 1.000e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.23 s, min 0.21 s, max 0.24 s, tot 0.91 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.23 s, min 0.21 s, max 0.24 s, tot 0.91 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 4.290e+03, min 1.716e+03, max 6.864e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.855e-02, min 4.261e-03, max 3.200e-02 (4 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 2.238e-07s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.564e-02s, min 1.200e-02s, max 2.253e-02s, tot 6.258e-02s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.809e-01 3.367e+00 +#pr: # Warning: extrapolated memory I/O bandwidth exceeds memory bandwidth --- is this a tiny matrix ? +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) #pr: ======== Limiting to transA=T: #pr: No sample (out of 8) matched the dump criteria -- skipping dump round. @@ -5022,62 +5062,63 @@ #pr: ======== All results (not limiting) #pr: Dump from a base of 8 samples (of max 16) ordered by (1,1,1,1,2,4,2) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 434.83 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.588e-04 2.68e+00 5.17e+00 1 2.40e-05 -pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 434.83 5.960e-06 0.000e+00 5.519e-08 0.000e+00 2.191e-04 1.59e+00 3.17e+00 1 2.40e-05 -pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1739.32 9.060e-06 0.000e+00 5.519e-08 0.000e+00 3.500e-04 2.68e+00 1.29e+00 1 9.60e-05 -pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.868e-06 0.000e+00 5.519e-08 0.000e+00 1.390e-04 4.86e+00 2.29e+00 1 9.60e-05 -pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1739.32 7.153e-06 0.000e+00 5.519e-08 0.000e+00 1.099e-04 6.59e+00 2.79e+00 1 9.60e-05 -pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1739.32 8.106e-06 0.000e+00 5.519e-08 0.000e+00 3.121e-04 3.55e+00 1.54e+00 1 9.60e-05 -pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6957.29 1.001e-05 0.000e+00 5.519e-08 0.000e+00 1.531e-04 6.59e+00 6.98e-01 1 3.84e-04 -pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6957.29 8.106e-06 0.000e+00 5.519e-08 0.000e+00 1.130e-04 1.27e+01 1.32e+00 1 3.84e-04 +pr: 1:R_R A 3 3 6 1 D S N 8 8 0 4.0000 4.6667 3 1 428.99 1.199e-02 0.000e+00 5.594e-08 0.000e+00 2.640e-01 2.65e+00 5.17e+00 1 2.40e-05 +pr: 3:R_R A 3 3 6 1 S S N 8 8 0 4.0000 4.6667 3 1 428.99 1.599e-02 0.000e+00 5.594e-08 0.000e+00 2.214e-01 1.57e+00 3.17e+00 1 2.40e-05 +pr: 5:R_R A 3 3 6 1 C S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.600e-02 0.000e+00 5.594e-08 0.000e+00 2.320e-01 2.65e+00 1.29e+00 1 9.60e-05 +pr: 7:R_R A 3 3 6 1 Z S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.785e-02 0.000e+00 5.594e-08 0.000e+00 2.520e-01 4.79e+00 2.29e+00 1 9.60e-05 +pr: 9:R_R A 3 3 6 4 D S N 8 8 0 4.0000 4.6667 3 1 1715.97 2.253e-02 0.000e+00 5.594e-08 0.000e+00 2.280e-01 6.51e+00 2.79e+00 1 9.60e-05 +pr: 11:R_R A 3 3 6 4 S S N 8 8 0 4.0000 4.6667 3 1 1715.97 1.602e-02 0.000e+00 5.594e-08 0.000e+00 2.400e-01 3.50e+00 1.54e+00 1 9.60e-05 +pr: 13:R_R A 3 3 6 4 C S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.200e-02 0.000e+00 5.594e-08 0.000e+00 2.330e-01 6.51e+00 6.98e-01 1 3.84e-04 +pr: 15:R_R A 3 3 6 4 Z S N 8 8 0 4.0000 4.6667 3 1 6863.89 1.203e-02 0.000e+00 5.594e-08 0.000e+00 2.120e-01 1.25e+01 1.32e+00 1 3.84e-04 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 8 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 14910.8 % faster, avg. sp. ratio 150.108x, max sp. ratio 181.425x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 3521.6/1991.4/6341.3/28172.8 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 24.0/ 13.9/ 38.6/192.0 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 24.2, min. 14.0, max. 38.9 ops) +#pr: (in succ. cases rsb autotuning gave avg. 30030530.7 % faster, avg. sp. ratio 300306.307x, max sp. ratio 497758.364x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 4205927.4/3789333.0/4718159.0/33647419.6 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 15.2/ 9.1/ 22.0/121.6 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 15.2, min. 9.1, max. 22.0 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 2/ 2/ 2) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 6/ 6/ 6) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 18/ 8/ 32) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 54/ 24/ 96) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 4.000/ 4.000/ 4.000) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.932/ 1.377/ 9.204,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 41.236/ 1.594/ 12.683,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.879/ 1.358/ 9.080,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 40.683/ 1.573/ 12.512,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 2.284/ 0.698/ 5.167) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 4.667/ 4.667/ 4.667) #pr: (matrix has been subdivided more/less/same in resp. 0 / 8 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /8 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (8 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.00 s, tot 0.00 s (8 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.718e+03, min 4.348e+02, max 6.957e+03 (8 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.753e+01, min 2.397e+00, max 4.737e+01 (8 samples) -#pr: best tun. rsb operation time was: on avg. 5.519e-08s, min 5.519e-08s, max 5.519e-08s, tot 4.416e-07s (8 samples) -#pr: ref. unt. rsb operation time was: on avg. 8.285e-06s, min 5.960e-06s, max 1.001e-05s, tot 6.628e-05s (8 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.915e+00 1.948e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.773e+00 +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.24 s, min 0.21 s, max 0.26 s, tot 1.88 s (8 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.24 s, min 0.21 s, max 0.26 s, tot 1.88 s (8 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.681e+03, min 4.290e+02, max 6.864e+03 (8 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 1.089e-02, min 1.501e-03, max 3.200e-02 (8 samples) +#pr: best tun. rsb operation time was: on avg. 5.594e-08s, min 5.594e-08s, max 5.594e-08s, tot 4.476e-07s (8 samples) +#pr: ref. unt. rsb operation time was: on avg. 1.680e-02s, min 1.199e-02s, max 2.785e-02s, tot 1.344e-01s (8 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 9.809e-01 6.557e+00 +#pr: # Warning: extrapolated memory I/O bandwidth exceeds memory bandwidth --- is this a tiny matrix ? +#pr: in-cache to in-memory MEMSET bandwidth ratio: 2.897e+00 #pr: rsb nrhs-to-overall-min-rhs speed ratio was: on avg. 4.000e+00 x, min 4.000e+00 x, max 4.000e+00 x (4 samples, the non-min-nrhs ones) -#pr: Record collection took 0.55 s. +#pr: Record collection took 15.13 s. #pr: Record comprises 50 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 100 environment variables in 4759 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 100 environment variables in 4813 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. -#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1767573713_gcc-14.2.rpr -# Removing the temporary record file rsbench_pr__1767573713_gcc-14.2.rpr.tmp. -# terminating run at 1767573722 (after 9.5s of w.c.t.) -srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/bash ./scripts/doc-tests.sh +#pr: ======== Saved a performance record of 16 samples to rsbench_pr__1733165264_gcc-14.2.rpr +# Removing the temporary record file rsbench_pr__1733165264_gcc-14.2.rpr.tmp. +# terminating run at 1733165293 (after 28.6s of w.c.t.) +srcdir="/build/reproducible-path/librsb-1.3.0.2+dfsg" /bin/sh ./scripts/doc-tests.sh + set -o pipefail + test x/build/reproducible-path/librsb-1.3.0.2+dfsg = x -+ cat /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/autotune.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/io-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/power.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/snippets.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/transpose.c + grep '^.\{71,\}' ++ cat /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/autotune.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/hello.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/io-spblas.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/power.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/snippets.c /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/transpose.c + true -+ cat /build/reproducible-path/librsb-1.3.0.2+dfsg/README + grep '^[^ ].\{80,\}' ++ cat /build/reproducible-path/librsb-1.3.0.2+dfsg/README + true ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -h ++ wc -l + test 63 -ge 61 -++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -h ++ wc -c +++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -h + test 2014 -ge 1966 ++ /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench -oa -Ob -h ++ wc -l @@ -5118,7 +5159,7 @@ type char codes:D S C Z gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' if test /build/reproducible-path/librsb-1.3.0.2+dfsg != /build/reproducible-path/librsb-1.3.0.2+dfsg ; then cp /build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/vf.mtx /build/reproducible-path/librsb-1.3.0.2+dfsg/examples ; fi -( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games" /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) +( PATH="/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path" /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/bench.sh; ) + which rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbench + BRF=test.rpr @@ -5128,15 +5169,15 @@ Will invoke autotuning for ~10.000000 s x 1 rounds, specifying verbosity=0 and threads=0. (>0 means no structure tuning; 0 means only structure tuning, <0 means tuning of both with (negated) thread count suggestion). # Requested no transposition. # performance record file set to: test.rpr -# beginning run at 1767573722 +# beginning run at 1733165294 # /build/reproducible-path/librsb-1.3.0.2+dfsg/.libs/rsbench -oa -Ob --bench --lower 100 --as-symmetric --types : -n 1 --notranspose --compare-competitors --verbose --verbose --write-performance-record=test.rpr # compiled with: CC=gcc CFLAGS=-g -O2 -Werror=implicit-function-declaration -fstack-protector-strong -Wformat -Werror=format-security -O3 -std=c99 -# average timer granularity: 5.11e-08 s +# average timer granularity: 5.34e-08 s # Will write a final performance record to file test.rpr and periodic checkpoints to test.rpr.tmp # will NOT perform ancillary tests. # will flush cache memory: between each operation measurement series, and NOT between each operation. # will keep any zero encountered in the matrix. -# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games +# env: export PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/i/capture/the/path # env: export LD_LIBRARY_PATH=/build/reproducible-path/librsb-1.3.0.2+dfsg/.libs:/usr/lib/libeatmydata # env: HOSTNAME is not set # env: KMP_AFFINITY is not set @@ -5175,7 +5216,7 @@ # env: SLURM_NTASKS is not set # env: SLURM_STEP_TASKS_PER_NODE is not set # env: SLURM_TASKS_PER_NODE is not set -# detected hostname: infom08-i386 +# detected hostname: i-capture-the-hostname # user specified a verbosity level of 2 (each --verbose occurrence counts +1) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 2097152 bytes @@ -5195,29 +5236,29 @@ # This test will measure times in scanning arrays sized and aligned to fit in caches. # 3 cache levels detected Will fill struct with 50 samples... -# Memory benchmark took 8.743s +# Memory benchmark took 11.772s # auto-tuning oriented output implies times==0 iterations and sort-after-load. #pr: allocated a performance record for 4 samples (1008 bytes). # multi-type benchmarking (DSCZ) -- now using typecode D (last was D). # Cache block size total 16777216 bytes, per-thread 2097152 bytes -# so far, program took 8.745s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . +# so far, program took 11.778s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.000s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 6.790e-04 s (100.00 %) - analyzed arrays in 4.840e-04 s (71.28 %) - cleaned-up arrays in 1.287e-05 s (1.90 %) - deduplicated arrays in 7.153e-06 s (1.05 %) + converted COO to RSB in 1.997e-01 s (100.00 %) + analyzed arrays in 3.972e-02 s (19.89 %) + cleaned-up arrays in 1.192e-05 s (0.01 %) + deduplicated arrays in 7.153e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.918e-05 s (14.61 %) - memory allocations took 1.168e-05 s (1.72 %) - leafs setup took 2.098e-05 s (3.09 %) - halfword conversion took 4.101e-05 s (6.04 %) -Built (100 x 100)[0x58175fa0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.001s): (100 x 100)[0x58175fa0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 1.120e-01 s (56.06 %) + memory allocations took 1.097e-05 s (0.01 %) + leafs setup took 6.914e-06 s (0.00 %) + halfword conversion took 4.800e-02 s (24.03 %) +Built (100 x 100)[0x57220fe0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.200s): (100 x 100)[0x57220fe0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -5268,10 +5309,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 9.608e-05s; avg 3.203e-05s ( +/- 21.84/ 43.67 %); best 2.503e-05s; worst 4.601e-05s; std dev. 9.89e-06 (taking best). -Reference operation time is 2.5034e-05 s (806.9 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 2.503e-05 Mflops: 806.904) -Merge (3 -> 1 leaves) took w.c.t. of 4.911e-05s, ~4.196e-05s of computing time (of which 2.003e-05s sorting, 2.146e-06s analysis) +3 iterations (1 th.) took 0.06397s; avg 0.02132s ( +/- 25.01/ 49.85 %); best 0.01599s; worst 0.03195s; std dev. 0.007516 (taking best). +Reference operation time is 0.0159912 s (1.263 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.01599 Mflops: 1.263) +Merge (3 -> 1 leaves) took w.c.t. of 0.0001099s, ~9.084e-05s of computing time (of which 3.886e-05s sorting, 6.914e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5302,7 +5343,7 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.004e-05s; avg 1.001e-05s ( +/- 0.00/ 0.00 %); best 1.001e-05s; worst 1.001e-05s; std dev. 0 (taking best). +3 iterations (1 th.) took 3.29e-05s; avg 1.097e-05s ( +/- 8.70/ 8.70 %); best 1.001e-05s; worst 1.192e-05s; std dev. 7.787e-07 (taking best). Reference operation time is 1.00136e-05 s (2017 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -5320,15 +5361,15 @@ # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success After merge step 1: tpop: 1.001e-05 s ~Mflops: 2017.260 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 2.500x: 2.503e-05s -> 1.001e-05s, so taking this instance. +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1596.952x: 0.01599s -> 1.001e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.001916s (of which 5.102e-05s partitioning, 0.00178s I/O); computing times: 4.196e-05s in par. loops, 2.003e-05s sorting, 2.146e-06s analyzing) -Total merge + benchmarking process took 0.001916s, equivalent to 191.4/76.5 new/old ops (5.007e-05s for 2 clones -- as 5.0/2.0 ops, or 2.5/1.0 ops per clone), SPEEDUP of 2.500x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 2.500x (2.503e-05s -> 1.001e-05s), will amortize in 127.6 ops by saving 1.502e-05s per op. -In 1 tuning rounds (tot. 0.0021s, 5e-05s for constructor, 2 clones) obtained a SPEEDUP of 150.0% (2.5x) (from 806.9 to 2017 Mflops). Employed 0.0019s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.2281s (of which 0.0001152s partitioning, 0.1641s I/O); computing times: 9.084e-05s in par. loops, 3.886e-05s sorting, 6.914e-06s analyzing) +Total merge + benchmarking process took 0.2281s, equivalent to 22775.8/14.3 new/old ops (0.1437s for 2 clones -- as 14348.5/9.0 ops, or 7174.3/4.5 ops per clone), SPEEDUP of 1596.952x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 1596.952x (0.01599s -> 1.001e-05s), will amortize in 14.3 ops by saving 0.01598s per op. +In 1 tuning rounds (tot. 0.37s, 0.14s for constructor, 2 clones) obtained a SPEEDUP of 159595.2% (1597x) (from 1.263 to 2017 Mflops). Employed 0.16s for I/O of matrix plots. #pr: updating sample at index 1 (0^th of 4), 0^th touch for (0,0,0,0,0,0,0). -First run of RSB Autotuner took 0.00398803 s (2.503e-05 s -> 1.001e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.532079 s (1.599e-02 s -> 1.001e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type D, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -5394,20 +5435,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.219e-05s; avg 1.073e-05s ( +/- 6.67/ 13.33 %); best 1.001e-05s; worst 1.216e-05s; std dev. 1.012e-06 (taking best). +3 iterations (1 th.) took 3.886e-05s; avg 1.295e-05s ( +/- 22.70/ 38.04 %); best 1.001e-05s; worst 1.788e-05s; std dev. 3.506e-06 (taking best). Reference operation time is 1.00136e-05 s (2017 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 5.007e-05 s (100.00 %) - analyzed arrays in 1.502e-05 s (30.00 %) - cleaned-up arrays in 7.153e-06 s (14.29 %) - deduplicated arrays in 5.960e-06 s (11.90 %) + converted COO to RSB in 9.991e-02 s (100.00 %) + analyzed arrays in 5.169e-02 s (51.74 %) + cleaned-up arrays in 5.960e-06 s (0.01 %) + deduplicated arrays in 6.914e-06 s (0.01 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.502e-05 s (30.00 %) - memory allocations took 1.907e-06 s (3.81 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 5.007e-06 s (10.00 %) -Built (100 x 100)[0x5817eaa0]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 4.818e-02 s (48.23 %) + memory allocations took 3.815e-06 s (0.00 %) + leafs setup took 2.861e-06 s (0.00 %) + halfword conversion took 8.106e-06 s (0.01 %) +Built (100 x 100)[0x57229ae0]{D} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 8). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -5441,16 +5482,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.159e-04 s (100.00 %) - analyzed arrays in 3.099e-05 s (26.75 %) - cleaned-up arrays in 5.960e-06 s (5.14 %) - deduplicated arrays in 5.960e-06 s (5.14 %) + converted COO to RSB in 1.797e-01 s (100.00 %) + analyzed arrays in 6.769e-02 s (37.67 %) + cleaned-up arrays in 7.153e-06 s (0.00 %) + deduplicated arrays in 6.914e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 5.579e-05 s (48.15 %) - memory allocations took 9.537e-07 s (0.82 %) - leafs setup took 1.192e-06 s (1.03 %) - halfword conversion took 1.383e-05 s (11.93 %) -Built (100 x 100)[0x581762e0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + shuffled partitions in 6.400e-02 s (35.61 %) + memory allocations took 5.007e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 4.799e-02 s (26.70 %) +Built (100 x 100)[0x57221320]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5496,9 +5537,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.796e-05s; avg 2.599e-05s ( +/- 7.34/ 7.34 %); best 2.408e-05s; worst 2.789e-05s; std dev. 1.557e-06 (taking best). -Reference operation time is 2.40803e-05 s (838.9 Mflops) with 1 threads. -Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 2.40803e-05 s/0 threads (speedup 0.415842 x), same?n. +3 iterations (1 th.) took 0.06394s; avg 0.02131s ( +/- 25.20/ 49.98 %); best 0.01594s; worst 0.03197s; std dev. 0.007533 (taking best). +Reference operation time is 0.0159431 s (1.267 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.0159431 s/0 threads (speedup 0.000628084 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -5532,16 +5573,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.311e-04 s (100.00 %) - analyzed arrays in 3.791e-05 s (28.91 %) - cleaned-up arrays in 7.153e-06 s (5.45 %) - deduplicated arrays in 5.960e-06 s (4.55 %) + converted COO to RSB in 1.599e-01 s (100.00 %) + analyzed arrays in 6.386e-02 s (39.94 %) + cleaned-up arrays in 6.914e-06 s (0.00 %) + deduplicated arrays in 5.960e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 6.413e-05 s (48.91 %) - memory allocations took 1.907e-06 s (1.45 %) - leafs setup took 9.537e-07 s (0.73 %) - halfword conversion took 1.311e-05 s (10.00 %) -Built (100 x 100)[0x58176a70]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + shuffled partitions in 4.800e-02 s (30.02 %) + memory allocations took 6.199e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 4.799e-02 s (30.02 %) +Built (100 x 100)[0x57221ab0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5587,9 +5628,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 8.893e-05s; avg 2.964e-05s ( +/- 5.90/ 7.77 %); best 2.789e-05s; worst 3.195e-05s; std dev. 1.701e-06 (taking best). -Reference operation time is 2.7895e-05 s (724.1 Mflops) with 1 threads. -Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 2.7895e-05 s/0 threads (speedup 0.358974 x), same?n. +3 iterations (1 th.) took 0.06398s; avg 0.02133s ( +/- 25.07/ 49.92 %); best 0.01598s; worst 0.03197s; std dev. 0.007527 (taking best). +Reference operation time is 0.01598 s (1.264 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.01598 s/0 threads (speedup 0.000626632 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -5623,16 +5664,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.581e-04 s (100.00 %) - analyzed arrays in 4.816e-05 s (30.47 %) - cleaned-up arrays in 6.914e-06 s (4.37 %) - deduplicated arrays in 5.960e-06 s (3.77 %) + converted COO to RSB in 1.439e-01 s (100.00 %) + analyzed arrays in 6.383e-02 s (44.37 %) + cleaned-up arrays in 7.153e-06 s (0.00 %) + deduplicated arrays in 5.960e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 7.796e-05 s (49.32 %) - memory allocations took 3.099e-06 s (1.96 %) - leafs setup took 1.907e-06 s (1.21 %) - halfword conversion took 1.407e-05 s (8.90 %) -Built (100 x 100)[0x5817eb80]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 22, symflags:'LS' + shuffled partitions in 3.202e-02 s (22.26 %) + memory allocations took 5.722e-06 s (0.00 %) + leafs setup took 5.007e-06 s (0.00 %) + halfword conversion took 4.798e-02 s (33.35 %) +Built (100 x 100)[0x57229bc0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 22, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5678,10 +5719,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 8.392e-05s; avg 2.797e-05s ( +/- 7.10/ 10.80 %); best 2.599e-05s; worst 3.099e-05s; std dev. 2.171e-06 (taking best). -Reference operation time is 2.59876e-05 s (777.3 Mflops) with 1 threads. -Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 1, 22 leaves, 2.284 bytes/nz, 2.59876e-05 s/0 threads (speedup 0.385321 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 30 subms, 22 lsubms, 2.2844 bpnz +3 iterations (1 th.) took 0.07994s; avg 0.02665s ( +/- 39.99/ 20.09 %); best 0.01599s; worst 0.032s; std dev. 0.007534 (taking best). +Reference operation time is 0.0159912 s (1.263 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 1, 22 leaves, 2.295 bytes/nz, 0.0159912 s/0 threads (speedup 0.000626193 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 30 subms, 22 lsubms, 2.2947 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5714,16 +5755,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.891e-04 s (100.00 %) - analyzed arrays in 6.294e-05 s (33.29 %) - cleaned-up arrays in 5.960e-06 s (3.15 %) - deduplicated arrays in 5.960e-06 s (3.15 %) + converted COO to RSB in 1.519e-01 s (100.00 %) + analyzed arrays in 5.585e-02 s (36.77 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 7.153e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 8.798e-05 s (46.53 %) - memory allocations took 7.153e-06 s (3.78 %) - leafs setup took 3.099e-06 s (1.64 %) - halfword conversion took 1.597e-05 s (8.45 %) -Built (100 x 100)[0x5817eb80]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 4.801e-02 s (31.61 %) + memory allocations took 7.153e-06 s (0.00 %) + leafs setup took 5.960e-06 s (0.00 %) + halfword conversion took 4.801e-02 s (31.61 %) +Built (100 x 100)[0x57229bc0]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5769,9 +5810,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 9.608e-05s; avg 3.203e-05s ( +/- 9.18/ 16.13 %); best 2.909e-05s; worst 3.719e-05s; std dev. 3.664e-06 (taking best). -Reference operation time is 2.90871e-05 s (694.5 Mflops) with 1 threads. -Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 2.90871e-05 s/0 threads (speedup 0.344262 x), same?n. +3 iterations (1 th.) took 0.07189s; avg 0.02396s ( +/- 0.31/ 0.16 %); best 0.02389s; worst 0.024s; std dev. 5.187e-05 (taking best). +Reference operation time is 0.0238891 s (0.8456 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.0238891 s/0 threads (speedup 0.00041917 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -5805,16 +5846,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.841e-04 s (100.00 %) - analyzed arrays in 5.913e-05 s (32.12 %) - cleaned-up arrays in 5.960e-06 s (3.24 %) - deduplicated arrays in 5.960e-06 s (3.24 %) + converted COO to RSB in 1.479e-01 s (100.00 %) + analyzed arrays in 5.190e-02 s (35.09 %) + cleaned-up arrays in 6.914e-06 s (0.00 %) + deduplicated arrays in 6.199e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 8.583e-05 s (46.63 %) - memory allocations took 1.001e-05 s (5.44 %) - leafs setup took 3.099e-06 s (1.68 %) - halfword conversion took 1.407e-05 s (7.64 %) -Built (100 x 100)[0x581a5a00]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 4.797e-02 s (32.43 %) + memory allocations took 7.868e-06 s (0.01 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 4.800e-02 s (32.46 %) +Built (100 x 100)[0x57250a40]{D} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -5860,9 +5901,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0001011s; avg 3.37e-05s ( +/- 10.85/ 6.84 %); best 3.004e-05s; worst 3.6e-05s; std dev. 2.614e-06 (taking best). -Reference operation time is 3.00407e-05 s (672.4 Mflops) with 1 threads. -Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 3.00407e-05 s/0 threads (speedup 0.333333 x), same?n. +3 iterations (1 th.) took 0.1099s; avg 0.03664s ( +/- 40.46/ 53.01 %); best 0.02182s; worst 0.05607s; std dev. 0.01436 (taking best). +Reference operation time is 0.021816 s (0.9259 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.021816 s/0 threads (speedup 0.000459001 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type D, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz Best sparse multiply performance with subdivision multiplier of 1: 2017.26 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing @@ -5880,23 +5921,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.00189495 s (eq. to 2e+02/ 2e+02 old/new op.times), gained local/global speedup 1 x (1.00136e-05 : 1.00136e-05) / 1 x (1.00136e-05 : 1.00136e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 1.27388 s (eq. to 1e+05/ 1e+05 old/new op.times), gained local/global speedup 1 x (1.00136e-05 : 1.00136e-05) / 1 x (1.00136e-05 : 1.00136e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.0019s, 0.0012s for constructor, 0 clones) obtained NO speedup (best stays 2017 Mflops). -Second run of RSB Autotuner took 0.00191402 s and estimated a speedup of 1.000000 x (1.001e-05 s -> 1.001e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 1.3s, 0.88s for constructor, 0 clones) obtained NO speedup (best stays 2017 Mflops). +Second run of RSB Autotuner took 1.27393 s and estimated a speedup of 1.000000 x (1.001e-05 s -> 1.001e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:100 #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000484 0.000099 0.000583 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000583 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000484 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000099 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.039718 0.111979 0.151697 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.151697 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.039718 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.111979 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 -nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000583 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.151697 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -5911,34 +5952,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.000679016 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.199734 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 0.00048399 0 9.91821e-05 -# so far, program took 8.822s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.006s/0.000s . +%constructor:lower-100x100-5050nz 0 0.0397182 0 0.111979 +# so far, program took 14.068s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.806s/0.000s . getrusage() stats: -ru_maxrss: 72 (maximum resident set size -- MB) -ru_stime : 0.2639s (system CPU time used) -ru_utime : 8.953s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.1409s (system CPU time used) +ru_utime : 9.248s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode S (last was D). # Cache block size total 16777216 bytes, per-thread 16777216 bytes -# so far, program took 8.822s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.006s/0.000s . +# so far, program took 14.068s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 1.806s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.950e-04 s (100.00 %) - analyzed arrays in 2.694e-05 s (13.81 %) - cleaned-up arrays in 6.199e-06 s (3.18 %) - deduplicated arrays in 6.914e-06 s (3.55 %) + converted COO to RSB in 2.816e-01 s (100.00 %) + analyzed arrays in 3.756e-02 s (13.34 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 6.914e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.318e-04 s (67.60 %) - memory allocations took 4.053e-06 s (2.08 %) - leafs setup took 9.537e-07 s (0.49 %) - halfword conversion took 1.812e-05 s (9.29 %) -Built (100 x 100)[0x5817eb80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.000s): (100 x 100)[0x5817eb80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 1.840e-01 s (65.34 %) + memory allocations took 4.292e-06 s (0.00 %) + leafs setup took 3.815e-06 s (0.00 %) + halfword conversion took 6.002e-02 s (21.32 %) +Built (100 x 100)[0x57229bc0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.282s): (100 x 100)[0x57229bc0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -5989,10 +6030,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.2e-05s; avg 2.4e-05s ( +/- 25.50/ 50.00 %); best 1.788e-05s; worst 3.6e-05s; std dev. 8.486e-06 (taking best). -Reference operation time is 1.78814e-05 s (1130 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 1.788e-05 Mflops: 1129.666) -Merge (3 -> 1 leaves) took w.c.t. of 3.409e-05s, ~3.004e-05s of computing time (of which 1.383e-05s sorting, 1.192e-06s analysis) +3 iterations (1 th.) took 0.07999s; avg 0.02666s ( +/- 9.97/ 19.92 %); best 0.02401s; worst 0.03197s; std dev. 0.003756 (taking best). +Reference operation time is 0.0240059 s (0.8415 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type S, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.02401 Mflops: 0.841) +Merge (3 -> 1 leaves) took w.c.t. of 4.506e-05s, ~3.099e-05s of computing time (of which 1.287e-05s sorting, 3.099e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6023,7 +6064,7 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.004e-05s; avg 1.001e-05s ( +/- 0.00/ 0.00 %); best 1.001e-05s; worst 1.001e-05s; std dev. 0 (taking best). +3 iterations (1 th.) took 3.386e-05s; avg 1.129e-05s ( +/- 11.27/ 14.08 %); best 1.001e-05s; worst 1.287e-05s; std dev. 1.189e-06 (taking best). Reference operation time is 1.00136e-05 s (2017 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -6041,15 +6082,15 @@ # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success After merge step 1: tpop: 1.001e-05 s ~Mflops: 2017.260 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1.786x: 1.788e-05s -> 1.001e-05s, so taking this instance. +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 2397.333x: 0.02401s -> 1.001e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002014s (of which 3.695e-05s partitioning, 0.001894s I/O); computing times: 3.004e-05s in par. loops, 1.383e-05s sorting, 1.192e-06s analyzing) -Total merge + benchmarking process took 0.002014s, equivalent to 201.1/112.6 new/old ops (4.601e-05s for 2 clones -- as 4.6/2.6 ops, or 2.3/1.3 ops per clone), SPEEDUP of 1.786x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 1.786x (1.788e-05s -> 1.001e-05s), will amortize in 256.0 ops by saving 7.868e-06s per op. -In 1 tuning rounds (tot. 0.0022s, 4.6e-05s for constructor, 2 clones) obtained a SPEEDUP of 78.6% (1.786x) (from 1130 to 2017 Mflops). Employed 0.0017s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.2035s (of which 4.816e-05s partitioning, 0.1315s I/O); computing times: 3.099e-05s in par. loops, 1.287e-05s sorting, 3.099e-06s analyzing) +Total merge + benchmarking process took 0.2035s, equivalent to 20321.4/8.5 new/old ops (0.1398s for 2 clones -- as 13956.5/5.8 ops, or 6978.2/2.9 ops per clone), SPEEDUP of 2397.333x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 2397.333x (0.02401s -> 1.001e-05s), will amortize in 8.5 ops by saving 0.024s per op. +In 1 tuning rounds (tot. 0.35s, 0.14s for constructor, 2 clones) obtained a SPEEDUP of 239633.3% (2397x) (from 0.8415 to 2017 Mflops). Employed 0.16s for I/O of matrix plots. #pr: updating sample at index 2 (1^th of 4), 0^th touch for (0,0,0,0,0,1,0). -First run of RSB Autotuner took 0.00395083 s (1.788e-05 s -> 1.001e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.515556 s (2.401e-02 s -> 1.001e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type S, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6115,20 +6156,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 14.62/ 17.69 %); best 8.821e-06s; worst 1.216e-05s; std dev. 1.381e-06 (taking best). -Reference operation time is 8.82149e-06 s (2290 Mflops) with 1 threads. +3 iterations (1 th.) took 3.6e-05s; avg 1.2e-05s ( +/- 16.56/ 33.11 %); best 1.001e-05s; worst 1.597e-05s; std dev. 2.81e-06 (taking best). +Reference operation time is 1.00136e-05 s (2017 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.697e-05 s (100.00 %) - analyzed arrays in 1.407e-05 s (29.95 %) - cleaned-up arrays in 6.199e-06 s (13.20 %) - deduplicated arrays in 5.960e-06 s (12.69 %) + converted COO to RSB in 9.630e-02 s (100.00 %) + analyzed arrays in 3.227e-02 s (33.51 %) + cleaned-up arrays in 5.960e-06 s (0.01 %) + deduplicated arrays in 5.960e-06 s (0.01 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.383e-05 s (29.44 %) - memory allocations took 1.907e-06 s (4.06 %) - leafs setup took 1.192e-06 s (2.54 %) - halfword conversion took 3.815e-06 s (8.12 %) -Built (100 x 100)[0x5817eaa0]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 6.399e-02 s (66.45 %) + memory allocations took 1.502e-05 s (0.02 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 4.768e-06 s (0.00 %) +Built (100 x 100)[0x57229ae0]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 8). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -6162,16 +6203,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.697e-05 s (100.00 %) - analyzed arrays in 1.884e-05 s (40.10 %) - cleaned-up arrays in 6.914e-06 s (14.72 %) - deduplicated arrays in 6.199e-06 s (13.20 %) + converted COO to RSB in 5.993e-02 s (100.00 %) + analyzed arrays in 3.598e-02 s (60.03 %) + cleaned-up arrays in 5.960e-06 s (0.01 %) + deduplicated arrays in 6.914e-06 s (0.01 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 9.060e-06 s (19.29 %) - memory allocations took 0.000e+00 s (0.00 %) - leafs setup took 9.537e-07 s (2.03 %) - halfword conversion took 5.007e-06 s (10.66 %) -Built (100 x 100)[0x58176db0]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 2.392e-02 s (39.92 %) + memory allocations took 4.053e-06 s (0.01 %) + leafs setup took 4.053e-06 s (0.01 %) + halfword conversion took 7.868e-06 s (0.01 %) +Built (100 x 100)[0x57221df0]{S} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6217,9 +6258,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 3.099e-05s; avg 1.033e-05s ( +/- 3.08/ 6.15 %); best 1.001e-05s; worst 1.097e-05s; std dev. 4.496e-07 (taking best). +3 iterations (1 th.) took 3.695e-05s; avg 1.232e-05s ( +/- 18.71/ 29.68 %); best 1.001e-05s; worst 1.597e-05s; std dev. 2.614e-06 (taking best). Reference operation time is 1.00136e-05 s (2017 Mflops) with 1 threads. -Challenging best inner round reference (8.82149e-06 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 1.00136e-05 s/0 threads (speedup 0.880952 x), same?n. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 0.25, 1 leaves, 2.08 bytes/nz, 1.00136e-05 s/0 threads (speedup 1 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -6253,16 +6294,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.099e-04 s (100.00 %) - analyzed arrays in 3.409e-05 s (31.02 %) - cleaned-up arrays in 5.960e-06 s (5.42 %) - deduplicated arrays in 5.960e-06 s (5.42 %) + converted COO to RSB in 1.439e-01 s (100.00 %) + analyzed arrays in 6.784e-02 s (47.16 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 6.199e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.506e-05 s (41.00 %) - memory allocations took 2.861e-06 s (2.60 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 1.597e-05 s (14.53 %) -Built (100 x 100)[0x58176db0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' + shuffled partitions in 4.400e-02 s (30.58 %) + memory allocations took 5.960e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 3.200e-02 s (22.24 %) +Built (100 x 100)[0x57221df0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6308,9 +6349,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.081e-05s; avg 2.36e-05s ( +/- 24.24/ 43.43 %); best 1.788e-05s; worst 3.386e-05s; std dev. 7.266e-06 (taking best). -Reference operation time is 1.78814e-05 s (1130 Mflops) with 1 threads. -Challenging best inner round reference (8.82149e-06 s/1 threads) with: subdivision 0.5, 6 leaves, 2.163 bytes/nz, 1.78814e-05 s/0 threads (speedup 0.493333 x), same?n. +3 iterations (1 th.) took 0.07594s; avg 0.02531s ( +/- 5.19/ 10.38 %); best 0.024s; worst 0.02794s; std dev. 0.001859 (taking best). +Reference operation time is 0.0239971 s (0.8418 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 0.5, 6 leaves, 2.163 bytes/nz, 0.0239971 s/0 threads (speedup 0.000417283 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 8 subms, 6 lsubms, 2.1632 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -6344,16 +6385,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.261e-04 s (100.00 %) - analyzed arrays in 4.411e-05 s (34.97 %) - cleaned-up arrays in 6.199e-06 s (4.91 %) - deduplicated arrays in 5.960e-06 s (4.73 %) + converted COO to RSB in 1.480e-01 s (100.00 %) + analyzed arrays in 4.792e-02 s (32.39 %) + cleaned-up arrays in 6.914e-06 s (0.00 %) + deduplicated arrays in 5.960e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 4.983e-05 s (39.51 %) - memory allocations took 2.861e-06 s (2.27 %) - leafs setup took 1.192e-06 s (0.95 %) - halfword conversion took 1.597e-05 s (12.67 %) -Built (100 x 100)[0x5817eb80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' + shuffled partitions in 6.417e-02 s (43.37 %) + memory allocations took 7.153e-06 s (0.00 %) + leafs setup took 5.007e-06 s (0.00 %) + halfword conversion took 3.583e-02 s (24.22 %) +Built (100 x 100)[0x57229bc0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6399,9 +6440,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.415e-05s; avg 2.472e-05s ( +/- 18.97/ 34.08 %); best 2.003e-05s; worst 3.314e-05s; std dev. 5.969e-06 (taking best). -Reference operation time is 2.00272e-05 s (1009 Mflops) with 1 threads. -Challenging best inner round reference (8.82149e-06 s/1 threads) with: subdivision 1, 16 leaves, 2.25 bytes/nz, 2.00272e-05 s/0 threads (speedup 0.440476 x), same?n. +3 iterations (1 th.) took 0.06789s; avg 0.02263s ( +/- 11.47/ 5.85 %); best 0.02003s; worst 0.02395s; std dev. 0.001835 (taking best). +Reference operation time is 0.0200338 s (1.008 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 1, 16 leaves, 2.25 bytes/nz, 0.0200338 s/0 threads (speedup 0.000499833 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 22 subms, 16 lsubms, 2.2503 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -6435,16 +6476,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.719e-04 s (100.00 %) - analyzed arrays in 6.104e-05 s (35.51 %) - cleaned-up arrays in 5.960e-06 s (3.47 %) - deduplicated arrays in 6.914e-06 s (4.02 %) + converted COO to RSB in 1.480e-01 s (100.00 %) + analyzed arrays in 4.794e-02 s (32.40 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 5.960e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 7.701e-05 s (44.80 %) - memory allocations took 4.053e-06 s (2.36 %) - leafs setup took 2.146e-06 s (1.25 %) - halfword conversion took 1.478e-05 s (8.60 %) -Built (100 x 100)[0x5817eb80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 4.801e-02 s (32.45 %) + memory allocations took 6.199e-06 s (0.00 %) + leafs setup took 5.007e-06 s (0.00 %) + halfword conversion took 5.198e-02 s (35.13 %) +Built (100 x 100)[0x57229bc0]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6490,9 +6531,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 8.106e-05s; avg 2.702e-05s ( +/- 22.35/ 41.18 %); best 2.098e-05s; worst 3.815e-05s; std dev. 7.877e-06 (taking best). -Reference operation time is 2.09808e-05 s (962.8 Mflops) with 1 threads. -Challenging best inner round reference (8.82149e-06 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 2.09808e-05 s/0 threads (speedup 0.420455 x), same?n. +3 iterations (1 th.) took 0.06796s; avg 0.02265s ( +/- 29.36/ 41.28 %); best 0.016s; worst 0.032s; std dev. 0.006806 (taking best). +Reference operation time is 0.016001 s (1.262 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.016001 s/0 threads (speedup 0.00062581 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -6526,16 +6567,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.709e-04 s (100.00 %) - analyzed arrays in 6.104e-05 s (35.70 %) - cleaned-up arrays in 6.914e-06 s (4.04 %) - deduplicated arrays in 5.960e-06 s (3.49 %) + converted COO to RSB in 1.719e-01 s (100.00 %) + analyzed arrays in 7.191e-02 s (41.83 %) + cleaned-up arrays in 6.914e-06 s (0.00 %) + deduplicated arrays in 5.960e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 7.200e-05 s (42.12 %) - memory allocations took 6.914e-06 s (4.04 %) - leafs setup took 3.099e-06 s (1.81 %) - halfword conversion took 1.502e-05 s (8.79 %) -Built (100 x 100)[0x58191e40]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 4.800e-02 s (27.92 %) + memory allocations took 7.153e-06 s (0.00 %) + leafs setup took 5.007e-06 s (0.00 %) + halfword conversion took 5.199e-02 s (30.24 %) +Built (100 x 100)[0x5723ce80]{S} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6581,11 +6622,11 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 7.677e-05s; avg 2.559e-05s ( +/- 10.56/ 21.12 %); best 2.289e-05s; worst 3.099e-05s; std dev. 3.821e-06 (taking best). -Reference operation time is 2.28882e-05 s (882.6 Mflops) with 1 threads. -Challenging best inner round reference (8.82149e-06 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 2.28882e-05 s/0 threads (speedup 0.385417 x), same?n. +3 iterations (1 th.) took 0.08492s; avg 0.02831s ( +/- 14.49/ 18.54 %); best 0.0242s; worst 0.03355s; std dev. 0.003901 (taking best). +Reference operation time is 0.024204 s (0.8346 Mflops) with 1 threads. +Challenging best inner round reference (1.00136e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.024204 s/0 threads (speedup 0.000413716 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type S, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz -Best sparse multiply performance with subdivision multiplier of 1: 2289.86 Mflops. +Best sparse multiply performance with subdivision multiplier of 1: 2017.26 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6601,23 +6642,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.00153399 s (eq. to 2e+02/ 2e+02 old/new op.times), gained local/global speedup 1 x (8.82149e-06 : 8.82149e-06) / 1 x (8.82149e-06 : 8.82149e-06). This is not amortizable ! +Last tuner inner round (1 of 1) took 1.06537 s (eq. to 1e+05/ 1e+05 old/new op.times), gained local/global speedup 1 x (1.00136e-05 : 1.00136e-05) / 1 x (1.00136e-05 : 1.00136e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.0015s, 0.00092s for constructor, 0 clones) obtained NO speedup (best stays 2290 Mflops). -Second run of RSB Autotuner took 0.00155115 s and estimated a speedup of 1.000000 x (8.821e-06 s -> 8.821e-06 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 1.1s, 0.77s for constructor, 0 clones) obtained NO speedup (best stays 2017 Mflops). +Second run of RSB Autotuner took 1.0654 s and estimated a speedup of 1.000000 x (1.001e-05 s -> 1.001e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 #max:1 #sum:100 #norm:10 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000027 0.000132 0.000159 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000159 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000027 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000132 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.037558 0.183970 0.221528 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.221528 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.037558 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.183970 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 -nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000159 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.221528 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -6632,34 +6673,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.000195026 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.281571 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 2.69413e-05 0 0.000131845 -# so far, program took 8.902s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.011s/0.000s . +%constructor:lower-100x100-5050nz 0 0.0375581 0 0.18397 +# so far, program took 16.229s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 3.387s/0.000s . getrusage() stats: -ru_maxrss: 72 (maximum resident set size -- MB) -ru_stime : 0.3241s (system CPU time used) -ru_utime : 9.398s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.2089s (system CPU time used) +ru_utime : 13.93s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode C (last was D). # Cache block size total 16777216 bytes, per-thread 16777216 bytes -# so far, program took 8.902s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.011s/0.000s . +# so far, program took 16.229s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 3.387s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.010e-04 s (100.00 %) - analyzed arrays in 7.796e-05 s (38.79 %) - cleaned-up arrays in 5.960e-06 s (2.97 %) - deduplicated arrays in 7.153e-06 s (3.56 %) + converted COO to RSB in 1.965e-01 s (100.00 %) + analyzed arrays in 4.500e-02 s (22.90 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 6.914e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 7.296e-05 s (36.30 %) - memory allocations took 2.861e-06 s (1.42 %) - leafs setup took 9.537e-07 s (0.47 %) - halfword conversion took 3.314e-05 s (16.49 %) -Built (100 x 100)[0x5817eb80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.000s): (100 x 100)[0x5817eb80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + shuffled partitions in 8.597e-02 s (43.74 %) + memory allocations took 5.245e-06 s (0.00 %) + leafs setup took 3.099e-06 s (0.00 %) + halfword conversion took 6.554e-02 s (33.35 %) +Built (100 x 100)[0x57229bc0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.197s): (100 x 100)[0x57229bc0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -6710,10 +6751,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.000164s; avg 5.468e-05s ( +/- 12.35/ 24.27 %); best 4.792e-05s; worst 6.795e-05s; std dev. 9.385e-06 (taking best). -Reference operation time is 4.79221e-05 s (1686 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 4.792e-05 Mflops: 1686.068) -Merge (3 -> 1 leaves) took w.c.t. of 3.386e-05s, ~2.909e-05s of computing time (of which 1.407e-05s sorting, 9.537e-07s analysis) +3 iterations (1 th.) took 0.08397s; avg 0.02799s ( +/- 14.26/ 14.24 %); best 0.024s; worst 0.03198s; std dev. 0.003257 (taking best). +Reference operation time is 0.0239999 s (3.367 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.024 Mflops: 3.367) +Merge (3 -> 1 leaves) took w.c.t. of 4.411e-05s, ~3.29e-05s of computing time (of which 1.407e-05s sorting, 2.861e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6744,8 +6785,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.000124s; avg 4.133e-05s ( +/- 8.27/ 6.73 %); best 3.791e-05s; worst 4.411e-05s; std dev. 2.57e-06 (taking best). -Reference operation time is 3.79086e-05 s (2131 Mflops) with 1 threads. +3 iterations (1 th.) took 0.0001099s; avg 3.664e-05s ( +/- 1.74/ 3.47 %); best 3.6e-05s; worst 3.791e-05s; std dev. 8.991e-07 (taking best). +Reference operation time is 3.60012e-05 s (2244 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6761,16 +6802,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 3.791e-05 s ~Mflops: 2131.445 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1.264x: 4.792e-05s -> 3.791e-05s, so taking this instance. +After merge step 1: tpop: 3.6e-05 s ~Mflops: 2244.369 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 666.642x: 0.024s -> 3.6e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002205s (of which 3.695e-05s partitioning, 0.001994s I/O); computing times: 2.909e-05s in par. loops, 1.407e-05s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.002205s, equivalent to 58.2/46.0 new/old ops (6.08e-05s for 2 clones -- as 1.6/1.3 ops, or 0.8/0.6 ops per clone), SPEEDUP of 1.264x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 1.264x (4.792e-05s -> 3.791e-05s), will amortize in 220.2 ops by saving 1.001e-05s per op. -In 1 tuning rounds (tot. 0.0025s, 6.1e-05s for constructor, 2 clones) obtained a SPEEDUP of 26.4% (1.264x) (from 1686 to 2131 Mflops). Employed 0.002s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.2161s (of which 4.697e-05s partitioning, 0.1401s I/O); computing times: 3.29e-05s in par. loops, 1.407e-05s sorting, 2.861e-06s analyzing) +Total merge + benchmarking process took 0.2161s, equivalent to 6001.4/9.0 new/old ops (0.1757s for 2 clones -- as 4880.4/7.3 ops, or 2440.2/3.7 ops per clone), SPEEDUP of 666.642x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 666.642x (0.024s -> 3.6e-05s), will amortize in 9.0 ops by saving 0.02396s per op. +In 1 tuning rounds (tot. 0.4s, 0.18s for constructor, 2 clones) obtained a SPEEDUP of 66564.2% (666.6x) (from 3.367 to 2244 Mflops). Employed 0.14s for I/O of matrix plots. #pr: updating sample at index 3 (2^th of 4), 0^th touch for (0,0,0,0,0,2,0). -First run of RSB Autotuner took 0.004493 s (4.792e-05 s -> 3.791e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.536454 s (2.400e-02 s -> 3.600e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type C, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -6836,20 +6877,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0001111s; avg 3.703e-05s ( +/- 2.79/ 3.00 %); best 3.6e-05s; worst 3.815e-05s; std dev. 8.778e-07 (taking best). +3 iterations (1 th.) took 0.000113s; avg 3.767e-05s ( +/- 4.43/ 8.86 %); best 3.6e-05s; worst 4.101e-05s; std dev. 2.36e-06 (taking best). Reference operation time is 3.60012e-05 s (2244 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.792e-05 s (100.00 %) - analyzed arrays in 1.502e-05 s (31.34 %) - cleaned-up arrays in 6.914e-06 s (14.43 %) - deduplicated arrays in 6.199e-06 s (12.94 %) + converted COO to RSB in 1.021e-01 s (100.00 %) + analyzed arrays in 4.767e-02 s (46.67 %) + cleaned-up arrays in 7.153e-06 s (0.01 %) + deduplicated arrays in 5.960e-06 s (0.01 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.383e-05 s (28.86 %) - memory allocations took 1.907e-06 s (3.98 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 4.053e-06 s (8.46 %) -Built (100 x 100)[0x5817eaa0]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 5.443e-02 s (53.30 %) + memory allocations took 3.099e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 5.007e-06 s (0.00 %) +Built (100 x 100)[0x57229ae0]{C} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 8). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -6883,16 +6924,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.149e-04 s (100.00 %) - analyzed arrays in 3.195e-05 s (27.80 %) - cleaned-up arrays in 5.960e-06 s (5.19 %) - deduplicated arrays in 5.960e-06 s (5.19 %) - sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 5.698e-05 s (49.59 %) - memory allocations took 2.146e-06 s (1.87 %) - leafs setup took 9.537e-07 s (0.83 %) - halfword conversion took 1.097e-05 s (9.54 %) -Built (100 x 100)[0x58177070]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' + converted COO to RSB in 1.633e-01 s (100.00 %) + analyzed arrays in 6.144e-02 s (37.62 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 5.960e-06 s (0.00 %) + sorted arrays in 9.537e-07 s (0.00 %) + shuffled partitions in 4.405e-02 s (26.98 %) + memory allocations took 8.106e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 5.778e-02 s (35.38 %) +Built (100 x 100)[0x572220b0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 3, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -6938,9 +6979,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.000144s; avg 4.8e-05s ( +/- 0.17/ 0.33 %); best 4.792e-05s; worst 4.816e-05s; std dev. 1.124e-07 (taking best). -Reference operation time is 4.79221e-05 s (1686 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 4.79221e-05 s/0 threads (speedup 0.751244 x), same?n. +3 iterations (1 th.) took 0.05412s; avg 0.01804s ( +/- 21.79/ 20.43 %); best 0.01411s; worst 0.02172s; std dev. 0.003114 (taking best). +Reference operation time is 0.014107 s (5.728 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 0.25, 3 leaves, 2.121 bytes/nz, 0.014107 s/0 threads (speedup 0.00255201 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -6974,16 +7015,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.559e-04 s (100.00 %) - analyzed arrays in 4.292e-05 s (27.52 %) - cleaned-up arrays in 5.960e-06 s (3.82 %) - deduplicated arrays in 6.199e-06 s (3.98 %) - sorted arrays in 9.537e-07 s (0.61 %) - shuffled partitions in 8.297e-05 s (53.21 %) - memory allocations took 9.537e-07 s (0.61 %) - leafs setup took 9.537e-07 s (0.61 %) - halfword conversion took 1.407e-05 s (9.02 %) -Built (100 x 100)[0x5817eb80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' + converted COO to RSB in 1.519e-01 s (100.00 %) + analyzed arrays in 5.984e-02 s (39.40 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 7.153e-06 s (0.00 %) + sorted arrays in 0.000e+00 s (0.00 %) + shuffled partitions in 4.801e-02 s (31.61 %) + memory allocations took 5.007e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 4.399e-02 s (28.97 %) +Built (100 x 100)[0x57229bc0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 10, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7029,10 +7070,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.00015s; avg 4.999e-05s ( +/- 2.23/ 3.97 %); best 4.888e-05s; worst 5.198e-05s; std dev. 1.408e-06 (taking best). -Reference operation time is 4.88758e-05 s (1653 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.196 bytes/nz, 4.88758e-05 s/0 threads (speedup 0.736585 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.1956 bpnz +3 iterations (1 th.) took 0.06395s; avg 0.02132s ( +/- 23.69/ 12.60 %); best 0.01627s; worst 0.024s; std dev. 0.003573 (taking best). +Reference operation time is 0.0162671 s (4.967 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 0.5, 10 leaves, 2.206 bytes/nz, 0.0162671 s/0 threads (speedup 0.00221314 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 14 subms, 10 lsubms, 2.2059 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7065,16 +7106,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.531e-04 s (100.00 %) - analyzed arrays in 5.007e-05 s (32.71 %) - cleaned-up arrays in 5.960e-06 s (3.89 %) - deduplicated arrays in 6.914e-06 s (4.52 %) + converted COO to RSB in 1.538e-01 s (100.00 %) + analyzed arrays in 5.584e-02 s (36.31 %) + cleaned-up arrays in 6.199e-06 s (0.00 %) + deduplicated arrays in 6.914e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 7.105e-05 s (46.42 %) - memory allocations took 3.099e-06 s (2.02 %) - leafs setup took 1.907e-06 s (1.25 %) - halfword conversion took 1.407e-05 s (9.19 %) -Built (100 x 100)[0x5817eb80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 23, symflags:'LS' + shuffled partitions in 4.804e-02 s (31.23 %) + memory allocations took 6.676e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 4.990e-02 s (32.44 %) +Built (100 x 100)[0x57229bc0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 22, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7120,10 +7161,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0001578s; avg 5.261e-05s ( +/- 3.47/ 6.50 %); best 5.078e-05s; worst 5.603e-05s; std dev. 2.418e-06 (taking best). -Reference operation time is 5.07832e-05 s (1591 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 1, 23 leaves, 2.295 bytes/nz, 5.07832e-05 s/0 threads (speedup 0.70892 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 32 subms, 23 lsubms, 2.2947 bpnz +3 iterations (1 th.) took 0.06582s; avg 0.02194s ( +/- 39.73/ 21.04 %); best 0.01322s; worst 0.02656s; std dev. 0.006167 (taking best). +Reference operation time is 0.0132241 s (6.11 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 1, 22 leaves, 2.295 bytes/nz, 0.0132241 s/0 threads (speedup 0.00272239 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 30 subms, 22 lsubms, 2.2947 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7156,16 +7197,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.810e-04 s (100.00 %) - analyzed arrays in 5.817e-05 s (32.15 %) - cleaned-up arrays in 5.960e-06 s (3.29 %) - deduplicated arrays in 5.960e-06 s (3.29 %) + converted COO to RSB in 1.440e-01 s (100.00 %) + analyzed arrays in 6.398e-02 s (44.42 %) + cleaned-up arrays in 3.505e-05 s (0.02 %) + deduplicated arrays in 5.960e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 8.488e-05 s (46.90 %) - memory allocations took 5.960e-06 s (3.29 %) - leafs setup took 3.099e-06 s (1.71 %) - halfword conversion took 1.597e-05 s (8.83 %) -Built (100 x 100)[0x5817eb80]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 4.119e-02 s (28.60 %) + memory allocations took 7.153e-06 s (0.00 %) + leafs setup took 5.007e-06 s (0.00 %) + halfword conversion took 3.880e-02 s (26.94 %) +Built (100 x 100)[0x57229bc0]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7211,9 +7252,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.000164s; avg 5.468e-05s ( +/- 3.20/ 6.40 %); best 5.293e-05s; worst 5.817e-05s; std dev. 2.473e-06 (taking best). -Reference operation time is 5.29289e-05 s (1527 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 5.29289e-05 s/0 threads (speedup 0.68018 x), same?n. +3 iterations (1 th.) took 0.07194s; avg 0.02398s ( +/- 0.16/ 0.14 %); best 0.02394s; worst 0.02401s; std dev. 2.911e-05 (taking best). +Reference operation time is 0.0239432 s (3.375 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.0239432 s/0 threads (speedup 0.00150361 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -7247,16 +7288,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.860e-04 s (100.00 %) - analyzed arrays in 6.104e-05 s (32.82 %) - cleaned-up arrays in 6.199e-06 s (3.33 %) - deduplicated arrays in 5.960e-06 s (3.21 %) + converted COO to RSB in 1.559e-01 s (100.00 %) + analyzed arrays in 5.985e-02 s (38.40 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 6.914e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 8.583e-05 s (46.15 %) - memory allocations took 8.821e-06 s (4.74 %) - leafs setup took 2.146e-06 s (1.15 %) - halfword conversion took 1.502e-05 s (8.08 %) -Built (100 x 100)[0x581a5a00]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 4.804e-02 s (30.82 %) + memory allocations took 7.868e-06 s (0.01 %) + leafs setup took 5.007e-06 s (0.00 %) + halfword conversion took 4.795e-02 s (30.76 %) +Built (100 x 100)[0x57250a40]{C} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7302,9 +7343,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0001631s; avg 5.436e-05s ( +/- 4.39/ 6.58 %); best 5.198e-05s; worst 5.794e-05s; std dev. 2.575e-06 (taking best). -Reference operation time is 5.19753e-05 s (1555 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 5.19753e-05 s/0 threads (speedup 0.692661 x), same?n. +3 iterations (1 th.) took 0.07194s; avg 0.02398s ( +/- 0.16/ 0.15 %); best 0.02394s; worst 0.02401s; std dev. 3.064e-05 (taking best). +Reference operation time is 0.0239401 s (3.375 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.0239401 s/0 threads (speedup 0.0015038 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type C, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz Best sparse multiply performance with subdivision multiplier of 1: 2244.37 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing @@ -7322,23 +7363,23 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.00248384 s (eq. to 7e+01/ 7e+01 old/new op.times), gained local/global speedup 1 x (3.60012e-05 : 3.60012e-05) / 1 x (3.60012e-05 : 3.60012e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 1.19993 s (eq. to 3e+04/ 3e+04 old/new op.times), gained local/global speedup 1 x (3.60012e-05 : 3.60012e-05) / 1 x (3.60012e-05 : 3.60012e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.0025s, 0.0013s for constructor, 0 clones) obtained NO speedup (best stays 2244 Mflops). -Second run of RSB Autotuner took 0.00253081 s and estimated a speedup of 1.000000 x (3.600e-05 s -> 3.600e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 1.2s, 0.87s for constructor, 0 clones) obtained NO speedup (best stays 2244 Mflops). +Second run of RSB Autotuner took 1.19996 s and estimated a speedup of 1.000000 x (3.600e-05 s -> 3.600e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.000078 0.000073 0.000151 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000151 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000078 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000073 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.044997 0.085966 0.130963 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.130963 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.044997 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.085966 %:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 %:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 -nan -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000151 +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.130963 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 @@ -7353,34 +7394,34 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.000200987 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.196526 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 0 7.79629e-05 0 7.29561e-05 -# so far, program took 8.985s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.018s/0.000s . +%constructor:lower-100x100-5050nz 0 0.044997 0 0.0859659 +# so far, program took 18.392s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 5.123s/0.000s . getrusage() stats: -ru_maxrss: 72 (maximum resident set size -- MB) -ru_stime : 0.3841s (system CPU time used) -ru_utime : 9.875s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.2647s (system CPU time used) +ru_utime : 19.19s (user CPU time used) # multi-type benchmarking (DSCZ) -- now using typecode Z (last was D). # Cache block size total 16777216 bytes, per-thread 16777216 bytes -# so far, program took 8.985s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.018s/0.000s . +# so far, program took 18.392s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 5.123s/0.000s . # Using 1 threads # Using alpha=1 beta=1 order=cols for rsb_spmv/rsb_spsv/rsb_spmm/rsb_spsm. # will use input matrix flags: RSB_FLAG_USE_HALFWORD_INDICES, RSB_FLAG_SORTED_INPUT, RSB_FLAG_LOWER, RSB_FLAG_QUAD_PARTITIONING, RSB_FLAG_SYMMETRIC, RSB_FLAG_OWN_PARTITIONING_ARRAYS # Using 1 threads Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.950e-04 s (100.00 %) - analyzed arrays in 2.408e-05 s (12.35 %) - cleaned-up arrays in 5.960e-06 s (3.06 %) - deduplicated arrays in 5.960e-06 s (3.06 %) - sorted arrays in 9.537e-07 s (0.49 %) - shuffled partitions in 1.290e-04 s (66.14 %) - memory allocations took 1.311e-05 s (6.72 %) - leafs setup took 9.537e-07 s (0.49 %) - halfword conversion took 1.502e-05 s (7.70 %) -Built (100 x 100)[0x5817eb80]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' -# Constructed matrix (took 0.000s): (100 x 100)[0x5817eb80]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' + converted COO to RSB in 2.024e-01 s (100.00 %) + analyzed arrays in 3.835e-02 s (18.94 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 5.960e-06 s (0.00 %) + sorted arrays in 0.000e+00 s (0.00 %) + shuffled partitions in 1.160e-01 s (57.29 %) + memory allocations took 2.122e-05 s (0.01 %) + leafs setup took 3.099e-06 s (0.00 %) + halfword conversion took 4.808e-02 s (23.75 %) +Built (100 x 100)[0x57229bc0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' +# Constructed matrix (took 0.202s): (100 x 100)[0x57229bc0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x2446196 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LS' # matrix consistency check took 0.000s (ok) RSB Sparse Blocks Autotuner invoked requesting max 6 splits and max 6 merges in 1 rounds, threads spec.0 (specify negative values to enable threads tuning). Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz. @@ -7431,10 +7472,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.000205s; avg 6.835e-05s ( +/- 12.09/ 20.00 %); best 6.008e-05s; worst 8.202e-05s; std dev. 9.736e-06 (taking best). -Reference operation time is 6.00815e-05 s (1345 Mflops) with 1 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 6.008e-05 Mflops: 1344.840) -Merge (3 -> 1 leaves) took w.c.t. of 9.704e-05s, ~8.297e-05s of computing time (of which 5.889e-05s sorting, 9.537e-07s analysis) +3 iterations (1 th.) took 0.0678s; avg 0.0226s ( +/- 28.92/ 41.22 %); best 0.01607s; worst 0.03192s; std dev. 0.006763 (taking best). +Reference operation time is 0.0160661 s (5.029 Mflops) with 1 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 4 subms, 3 lsubms, 2.1212 bpnz (tpop: 0.01607 Mflops: 5.029) +Merge (3 -> 1 leaves) took w.c.t. of 9.203e-05s, ~7.105e-05s of computing time (of which 3.505e-05s sorting, 2.146e-06s analysis) # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7465,8 +7506,8 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0001099s; avg 3.664e-05s ( +/- 1.74/ 0.87 %); best 3.6e-05s; worst 3.695e-05s; std dev. 4.496e-07 (taking best). -Reference operation time is 3.60012e-05 s (2244 Mflops) with 1 threads. +3 iterations (1 th.) took 0.01212s; avg 0.00404s ( +/- 99.09/198.17 %); best 3.695e-05s; worst 0.01205s; std dev. 0.005661 (taking best). +Reference operation time is 3.69549e-05 s (2186 Mflops) with 1 threads. # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7482,16 +7523,16 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -After merge step 1: tpop: 3.6e-05 s ~Mflops: 2244.369 nsubm:1 otn:1 -Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 1.669x: 6.008e-05s -> 3.6e-05s, so taking this instance. +After merge step 1: tpop: 3.695e-05 s ~Mflops: 2186.450 nsubm:1 otn:1 +Applying merge (3 -> 1 leaves, 1 th.) yielded SPEEDUP of 434.748x: 0.01607s -> 3.695e-05s, so taking this instance. Saved plot to test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.002927s (of which 9.894e-05s partitioning, 0.002606s I/O); computing times: 8.297e-05s in par. loops, 5.889e-05s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.002927s, equivalent to 81.3/48.7 new/old ops (0.0002029s for 2 clones -- as 5.6/3.4 ops, or 2.8/1.7 ops per clone), SPEEDUP of 1.669x -Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 1.669x (6.008e-05s -> 3.6e-05s), will amortize in 121.6 ops by saving 2.408e-05s per op. -In 1 tuning rounds (tot. 0.0033s, 0.0002s for constructor, 2 clones) obtained a SPEEDUP of 66.9% (1.669x) (from 1345 to 2244 Mflops). Employed 0.0026s for I/O of matrix plots. +A total of 1 merge steps (of max 6) (3 -> 1 subms) took 0.2123s (of which 9.513e-05s partitioning, 0.1321s I/O); computing times: 7.105e-05s in par. loops, 3.505e-05s sorting, 2.146e-06s analyzing) +Total merge + benchmarking process took 0.2123s, equivalent to 5744.3/13.2 new/old ops (0.1478s for 2 clones -- as 3999.8/9.2 ops, or 1999.9/4.6 ops per clone), SPEEDUP of 434.748x +Applying multi-merge (3 -> 1 leaves, 1 steps, 0 -> 1 th.sp.) yielded SPEEDUP of 434.748x (0.01607s -> 3.695e-05s), will amortize in 13.2 ops by saving 0.01603s per op. +In 1 tuning rounds (tot. 0.36s, 0.15s for constructor, 2 clones) obtained a SPEEDUP of 43374.8% (434.7x) (from 5.029 to 2186 Mflops). Employed 0.16s for I/O of matrix plots. #pr: updating sample at index 4 (3^th of 4), 0^th touch for (0,0,0,0,0,3,0). -First run of RSB Autotuner took 0.0060041 s (6.008e-05 s -> 3.600e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). +First run of RSB Autotuner took 0.520009 s (1.607e-02 s -> 3.695e-05 s per spmv_sxsa) (tuned: 3 -> 1 lsubm). RSB Sparse Blocks Autotuner invoked requesting max 0 splits and max 0 merges in 1 rounds, auto threads spec. Will autotune matrix: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 1 subms, 1 lsubms, 2.0800 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:10 @@ -7557,20 +7598,20 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0001121s; avg 3.735e-05s ( +/- 3.62/ 4.68 %); best 3.6e-05s; worst 3.91e-05s; std dev. 1.296e-06 (taking best). +3 iterations (1 th.) took 0.0001149s; avg 3.831e-05s ( +/- 6.02/ 9.54 %); best 3.6e-05s; worst 4.196e-05s; std dev. 2.614e-06 (taking best). Reference operation time is 3.60012e-05 s (2244 Mflops) with 1 threads. Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 4.816e-05 s (100.00 %) - analyzed arrays in 1.216e-05 s (25.25 %) - cleaned-up arrays in 5.960e-06 s (12.38 %) - deduplicated arrays in 5.960e-06 s (12.38 %) + converted COO to RSB in 8.350e-02 s (100.00 %) + analyzed arrays in 3.549e-02 s (42.50 %) + cleaned-up arrays in 5.960e-06 s (0.01 %) + deduplicated arrays in 6.199e-06 s (0.01 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.597e-05 s (33.17 %) - memory allocations took 3.099e-06 s (6.44 %) - leafs setup took 9.537e-07 s (1.98 %) - halfword conversion took 4.053e-06 s (8.42 %) -Built (100 x 100)[0x5817eaa0]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' + shuffled partitions in 4.799e-02 s (57.47 %) + memory allocations took 3.815e-06 s (0.00 %) + leafs setup took 3.099e-06 s (0.00 %) + halfword conversion took 5.007e-06 s (0.01 %) +Built (100 x 100)[0x57229ae0]{Z} @ (0(0..100),0(0..100)) (5050 nnz, 50 nnz/r) flags 0x42644094 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'LS' Starting autotuning stage, with subdivision of 1 (current threads=1, requested threads=0, max threads = 8). # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -7604,16 +7645,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.662e-04 s (100.00 %) - analyzed arrays in 3.600e-05 s (21.66 %) - cleaned-up arrays in 5.960e-06 s (3.59 %) - deduplicated arrays in 5.960e-06 s (3.59 %) + converted COO to RSB in 1.557e-01 s (100.00 %) + analyzed arrays in 4.773e-02 s (30.65 %) + cleaned-up arrays in 7.153e-06 s (0.00 %) + deduplicated arrays in 5.960e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.001e-04 s (60.26 %) - memory allocations took 2.146e-06 s (1.29 %) - leafs setup took 9.537e-07 s (0.57 %) - halfword conversion took 1.502e-05 s (9.04 %) -Built (100 x 100)[0x58181c30]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' + shuffled partitions in 4.800e-02 s (30.82 %) + memory allocations took 5.007e-06 s (0.00 %) + leafs setup took 2.146e-06 s (0.00 %) + halfword conversion took 5.999e-02 s (38.52 %) +Built (100 x 100)[0x5722cc70]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 6, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7659,9 +7700,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.25 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0001879s; avg 6.262e-05s ( +/- 7.49/ 10.03 %); best 5.794e-05s; worst 6.89e-05s; std dev. 4.616e-06 (taking best). -Reference operation time is 5.79357e-05 s (1395 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 5.79357e-05 s/0 threads (speedup 0.621399 x), same?n. +3 iterations (1 th.) took 0.06394s; avg 0.02131s ( +/- 25.20/ 49.78 %); best 0.01594s; worst 0.03192s; std dev. 0.007503 (taking best). +Reference operation time is 0.0159421 s (5.068 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 0.25, 6 leaves, 2.163 bytes/nz, 0.0159421 s/0 threads (speedup 0.00225825 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 8 subms, 6 lsubms, 2.1632 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -7695,16 +7736,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 1.760e-04 s (100.00 %) - analyzed arrays in 4.005e-05 s (22.76 %) - cleaned-up arrays in 5.960e-06 s (3.39 %) - deduplicated arrays in 6.199e-06 s (3.52 %) + converted COO to RSB in 1.437e-01 s (100.00 %) + analyzed arrays in 4.776e-02 s (33.23 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 6.914e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.059e-04 s (60.16 %) - memory allocations took 1.907e-06 s (1.08 %) - leafs setup took 2.146e-06 s (1.22 %) - halfword conversion took 1.287e-05 s (7.32 %) -Built (100 x 100)[0x5817eb80]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 15, symflags:'LS' + shuffled partitions in 6.394e-02 s (44.49 %) + memory allocations took 7.153e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 3.200e-02 s (22.27 %) +Built (100 x 100)[0x57229bc0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 16, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7750,10 +7791,10 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 0.5 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.000175s; avg 5.833e-05s ( +/- 2.32/ 4.63 %); best 5.698e-05s; worst 6.104e-05s; std dev. 1.911e-06 (taking best). -Reference operation time is 5.6982e-05 s (1418 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 0.5, 15 leaves, 2.23 bytes/nz, 5.6982e-05 s/0 threads (speedup 0.631799 x), same?n. -New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 20 subms, 15 lsubms, 2.2297 bpnz +3 iterations (1 th.) took 0.06401s; avg 0.02134s ( +/- 25.11/ 49.79 %); best 0.01598s; worst 0.03196s; std dev. 0.007511 (taking best). +Reference operation time is 0.0159781 s (5.057 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 0.5, 16 leaves, 2.25 bytes/nz, 0.0159781 s/0 threads (speedup 0.00225316 x), same?n. +New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 22 subms, 16 lsubms, 2.2503 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7786,16 +7827,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.220e-04 s (100.00 %) - analyzed arrays in 6.700e-05 s (30.18 %) - cleaned-up arrays in 7.153e-06 s (3.22 %) - deduplicated arrays in 5.960e-06 s (2.69 %) + converted COO to RSB in 1.717e-01 s (100.00 %) + analyzed arrays in 6.364e-02 s (37.07 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 7.153e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.202e-04 s (54.14 %) - memory allocations took 4.768e-06 s (2.15 %) - leafs setup took 1.907e-06 s (0.86 %) - halfword conversion took 1.502e-05 s (6.77 %) -Built (100 x 100)[0x5817eb80]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 34, symflags:'LS' + shuffled partitions in 6.000e-02 s (34.95 %) + memory allocations took 1.001e-05 s (0.01 %) + leafs setup took 5.960e-06 s (0.00 %) + halfword conversion took 4.799e-02 s (27.96 %) +Built (100 x 100)[0x57229bc0]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 34, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7841,9 +7882,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0002041s; avg 6.803e-05s ( +/- 2.92/ 4.44 %); best 6.604e-05s; worst 7.105e-05s; std dev. 2.171e-06 (taking best). -Reference operation time is 6.60419e-05 s (1223 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 1, 34 leaves, 2.372 bytes/nz, 6.60419e-05 s/0 threads (speedup 0.545126 x), same?n. +3 iterations (1 th.) took 0.06402s; avg 0.02134s ( +/- 24.90/ 49.56 %); best 0.01603s; worst 0.03192s; std dev. 0.007479 (taking best). +Reference operation time is 0.016026 s (5.042 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 1, 34 leaves, 2.372 bytes/nz, 0.016026 s/0 threads (speedup 0.00224642 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 47 subms, 34 lsubms, 2.3723 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -7877,16 +7918,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.141e-04 s (100.00 %) - analyzed arrays in 6.485e-05 s (30.29 %) - cleaned-up arrays in 6.914e-06 s (3.23 %) - deduplicated arrays in 5.960e-06 s (2.78 %) + converted COO to RSB in 1.437e-01 s (100.00 %) + analyzed arrays in 4.765e-02 s (33.17 %) + cleaned-up arrays in 6.914e-06 s (0.00 %) + deduplicated arrays in 6.199e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.101e-04 s (51.45 %) - memory allocations took 9.298e-06 s (4.34 %) - leafs setup took 1.907e-06 s (0.89 %) - halfword conversion took 1.502e-05 s (7.02 %) -Built (100 x 100)[0x581cd150]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 4.801e-02 s (33.42 %) + memory allocations took 1.001e-05 s (0.01 %) + leafs setup took 3.815e-06 s (0.00 %) + halfword conversion took 4.798e-02 s (33.40 %) +Built (100 x 100)[0x57278190]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -7932,9 +7973,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 2 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0002079s; avg 6.93e-05s ( +/- 3.33/ 6.65 %); best 6.7e-05s; worst 7.391e-05s; std dev. 3.259e-06 (taking best). -Reference operation time is 6.69956e-05 s (1206 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 6.69956e-05 s/0 threads (speedup 0.537367 x), same?n. +3 iterations (1 th.) took 0.07194s; avg 0.02398s ( +/- 33.09/ 33.00 %); best 0.01605s; worst 0.03189s; std dev. 0.00647 (taking best). +Reference operation time is 0.0160458 s (5.036 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 2, 36 leaves, 2.383 bytes/nz, 0.0160458 s/0 threads (speedup 0.00224365 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes @@ -7968,16 +8009,16 @@ # librsb version 1.3.0.2 - 202212201855: Initialization success Building a matrix with 5050 nnz, 100 x 100 Duplicates check: 5050 - 0 = 5050 - converted COO to RSB in 2.260e-04 s (100.00 %) - analyzed arrays in 6.700e-05 s (29.64 %) - cleaned-up arrays in 6.914e-06 s (3.06 %) - deduplicated arrays in 5.960e-06 s (2.64 %) + converted COO to RSB in 1.957e-01 s (100.00 %) + analyzed arrays in 6.369e-02 s (32.54 %) + cleaned-up arrays in 5.960e-06 s (0.00 %) + deduplicated arrays in 7.153e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 1.090e-04 s (48.21 %) - memory allocations took 1.812e-05 s (8.02 %) - leafs setup took 3.099e-06 s (1.37 %) - halfword conversion took 1.597e-05 s (7.07 %) -Built (100 x 100)[0x581cd150]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' + shuffled partitions in 7.199e-02 s (36.79 %) + memory allocations took 1.907e-05 s (0.01 %) + leafs setup took 4.768e-06 s (0.00 %) + halfword conversion took 5.999e-02 s (30.65 %) +Built (100 x 100)[0x57278190]{Z} @ (0(0..0),0(0..0)) (5050 nnz, 50 nnz/r) flags 0x42646096 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 36, symflags:'LS' # librsb version 1.3.0.2 - 202212201855: Initializing # Cache block size total 16777216 bytes, per-thread 16777216 bytes # RSB_IO_WANT_MEMORY_HIERARCHY_INFO_STRING: unset @@ -8023,9 +8064,9 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 4 # librsb version 1.3.0.2 - 202212201855: Initialization success -3 iterations (1 th.) took 0.0002129s; avg 7.097e-05s ( +/- 5.60/ 2.80 %); best 6.7e-05s; worst 7.296e-05s; std dev. 2.81e-06 (taking best). -Reference operation time is 6.69956e-05 s (1206 Mflops) with 1 threads. -Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 6.69956e-05 s/0 threads (speedup 0.537367 x), same?n. +3 iterations (1 th.) took 0.06395s; avg 0.02132s ( +/- 25.21/ 50.19 %); best 0.01594s; worst 0.03202s; std dev. 0.007566 (taking best). +Reference operation time is 0.0159428 s (5.068 Mflops) with 1 threads. +Challenging best inner round reference (3.60012e-05 s/1 threads) with: subdivision 4, 36 leaves, 2.383 bytes/nz, 0.0159428 s/0 threads (speedup 0.00225815 x), same?n. New candidate clone performs slowly; discarding it: 100 x 100, type Z, 5050 nnz, 50 nnz/r, 50 subms, 36 lsubms, 2.3834 bpnz Best sparse multiply performance with subdivision multiplier of 1: 2244.37 Mflops. # librsb version 1.3.0.2 - 202212201855: Initializing @@ -8043,29 +8084,29 @@ # RSB_IO_WANT_SORT_METHOD: 0 # RSB_IO_WANT_SUBDIVISION_MULTIPLIER: 1 # librsb version 1.3.0.2 - 202212201855: Initialization success -Last tuner inner round (1 of 1) took 0.00408792 s (eq. to 1e+02/ 1e+02 old/new op.times), gained local/global speedup 1 x (3.60012e-05 : 3.60012e-05) / 1 x (3.60012e-05 : 3.60012e-05). This is not amortizable ! +Last tuner inner round (1 of 1) took 1.22389 s (eq. to 3e+04/ 3e+04 old/new op.times), gained local/global speedup 1 x (3.60012e-05 : 3.60012e-05) / 1 x (3.60012e-05 : 3.60012e-05). This is not amortizable ! Auto tuning inner round 1 did not find a configuration better than the original. -In 1 tuning rounds (tot. 0.0041s, 0.0025s for constructor, 0 clones) obtained NO speedup (best stays 2244 Mflops). -Second run of RSB Autotuner took 0.00411081 s and estimated a speedup of 1.000000 x (3.600e-05 s -> 3.600e-05 s per op) in same matrix (1 -> 1 lsubm) +In 1 tuning rounds (tot. 1.2s, 0.9s for constructor, 0 clones) obtained NO speedup (best stays 2244 Mflops). +Second run of RSB Autotuner took 1.22392 s and estimated a speedup of 1.000000 x (3.600e-05 s -> 3.600e-05 s per op) in same matrix (1 -> 1 lsubm) #min:1 0 #max:1 0 #sum:100 0 #norm:10 0 #used index storage compared to COO:10504 vs 40400 bytes (26.00%) ; compared to CSR:10504 vs 20604 bytes (50.99%) #%:CONSTRUCTOR_*:SORT SCAN INSERT SCAN+INSERT -%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000001 0.000024 0.000129 0.000153 -%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000154 -%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000024 -%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000129 -%:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000001 -%:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.000 -%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000153 +%:CONSTRUCTOR_TIMES:lower-100x100-5050nz S N 1 100 100 5050 0.000000 0.038347 0.115979 0.154326 +%:UNSORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.154326 +%:RSB_SUBDIVISION_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.038347 +%:RSB_SHUFFLE_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.115979 +%:ROW_MAJOR_SORT_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.000000 +%:ROW_MAJOR_SORT_SCALING:lower-100x100-5050nz S N 1 100 100 5050 -nan +%:SORTEDCOO2RSB_TIME:lower-100x100-5050nz S N 1 100 100 5050 0.154326 %:ROW_MAJOR_SORT_TO_MOP:lower-100x100-5050nz S N 1 100 100 5050 0.000 %:UNSORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:SORTEDCOO2RSB_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:RSB_SUBDIVISION_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 %:RSB_SHUFFLE_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 -%:CONSTRUCTOR_SCALING:lower-100x100-5050nz S N 1 100 100 5050 1.00 1.00 1.00 1.00 +%:CONSTRUCTOR_SCALING:lower-100x100-5050nz S N 1 100 100 5050 -nan 1.00 1.00 1.00 #%:SM_COUNTS: Tot HalfwordCsr FullwordCsr HalfwordCoo FullwordCoo %:SM_COUNTS:lower-100x100-5050nz S N 1 100 100 5050 1 1 0 0 0 %:SM_IDXOCCUPATIONRSBVSCOOANDCSR:lower-100x100-5050nz S N 1 100 100 5050 10504 40400 20600 @@ -8074,68 +8115,68 @@ %:SM_MINMAXAVGNNZ:lower-100x100-5050nz S N 1 100 100 5050 5050 5050 5050 # %operation:matrix CONSTRUCTOR[1] SPMV[1] SPMV[1] -%operation:lower-100x100-5050nz 0.000195026 1e+09 1e+09 +%operation:lower-100x100-5050nz 0.202446 1e+09 1e+09 %constructor:matrix SORT[1] SCAN[1] SHUFFLE[1] INSERT[1] -%constructor:lower-100x100-5050nz 9.53674e-07 2.40803e-05 0 0.000128984 -# so far, program took 9.070s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 0.029s/0.000s . +%constructor:lower-100x100-5050nz 0 0.038347 0 0.115979 +# so far, program took 20.677s of wall clock time; ancillary tests 0.000s; I/O 0.000s; checks 0.000s; conversions 0.000s; rsb/mkl tuning 6.867s/0.000s . getrusage() stats: -ru_maxrss: 72 (maximum resident set size -- MB) -ru_stime : 0.4445s (system CPU time used) -ru_utime : 10.35s (user CPU time used) +ru_maxrss: 69 (maximum resident set size -- MB) +ru_stime : 0.3397s (system CPU time used) +ru_utime : 24.2s (user CPU time used) # benchmarking terminated --- finalizing run. # ====== BEGIN Total summary record. #pr: ======== All results (not limiting) #pr: Dump from a base of 4 samples (of max 4) ordered by (1,1,1,1,1,4,1) = (filename x cores x incX x incY x nrhs x typecode x transA). pr: BESTCODE MTX NR NC NNZ NRHS TYPE SYM TRANS NT AT-NT AT-MKL-NT BPNZ AT-BPNZ NSUBM AT-SUBM RSBBEST-MFLOPS OPTIME MKL-OPTIME AT-OPTIME AT-MKL-OPTIME AT-TIME RWminBW-GBps CB-bpf AT-MS CMFLOPS -pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 2017.26 2.503e-05 0.000e+00 1.001e-05 0.000e+00 3.988e-03 5.32e+00 2.60e+00 1 2.02e-02 -pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 2017.26 1.788e-05 0.000e+00 1.001e-05 0.000e+00 3.951e-03 3.19e+00 1.56e+00 1 2.02e-02 -pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 2131.45 4.792e-05 0.000e+00 3.791e-05 0.000e+00 4.493e-03 1.41e+00 6.50e-01 1 8.08e-02 -pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 2244.37 6.008e-05 0.000e+00 3.600e-05 0.000e+00 6.004e-03 2.67e+00 1.17e+00 1 8.08e-02 +pr: 1:R_R lower-100x100-5050nz 100 100 5050 1 D S N 1 1 0 2.1212 2.0800 3 1 2017.26 1.599e-02 0.000e+00 1.001e-05 0.000e+00 5.321e-01 5.32e+00 2.60e+00 1 2.02e-02 +pr: 2:R_R lower-100x100-5050nz 100 100 5050 1 S S N 1 1 0 2.1212 2.0800 3 1 2017.26 2.401e-02 0.000e+00 1.001e-05 0.000e+00 5.156e-01 3.19e+00 1.56e+00 1 2.02e-02 +pr: 3:R_R lower-100x100-5050nz 100 100 5050 1 C S N 1 1 0 2.1212 2.0800 3 1 2244.37 2.400e-02 0.000e+00 3.600e-05 0.000e+00 5.365e-01 1.48e+00 6.50e-01 1 8.08e-02 +pr: 4:R_R lower-100x100-5050nz 100 100 5050 1 Z S N 1 1 0 2.1212 2.0800 3 1 2186.45 1.607e-02 0.000e+00 3.695e-05 0.000e+00 5.200e-01 2.60e+00 1.17e+00 1 8.08e-02 #pr: below, we define 'successful' autotuning when speedup of 1.010000x is exceeded, and 'tuned' results even the ones which are same as untuned #pr: rsb autotuning was successful in 4 cases (100.00 %) and unsuccessful in 0 cases (0.00 %) -#pr: (in succ. cases rsb autotuning gave avg. 80.5 % faster, avg. sp. ratio 1.805x, max sp. ratio 2.500x, avg. ratio 0.000x) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 269.5/118.5/398.3/1078.1 tuned ops) -#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 143.5/ 93.8/220.9/573.9 untuned ops) -#pr: (and amortizes from untuned rsb in avg. 366.4, min. 249.3, max. 502.2 ops) +#pr: (in succ. cases rsb autotuning gave avg. 127291.9 % faster, avg. sp. ratio 1273.919x, max sp. ratio 2397.333x, avg. ratio 0.000x) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 33398.5/14071.5/53135.7/133593.9 tuned ops) +#pr: (in succ. cases rsb autotuning took an avg/min/max/tot of: 27.4/ 21.5/ 33.3/109.5 untuned ops) +#pr: (and amortizes from untuned rsb in avg. 27.4, min. 21.5, max. 33.3 ops) #pr: (avg/min/max (avg) nnz per subm before successful tuning were 1683/ 1683/ 1683) #pr: (avg/min/max (avg) nnz per subm after successful tuning were 5050/ 5050/ 5050) #pr: (avg/min/max (avg) bytes per subm before successful tuning were 15150/ 6733/ 26933) #pr: (avg/min/max (avg) bytes per subm after successful tuning were 45450/ 20200/ 80800) #pr: (avg/min/max (avg) bytes per nnz before successful tuning were 2.121/ 2.121/ 2.121) -#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.100/ 1.385/ 5.243,GBps) -#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.585/ 1.406/ 5.323,GBps) +#pr: (avg/min/max operands (mtx,lhs,rhs) read bandwidth lower bound 3.101/ 1.458/ 5.243,GBps) +#pr: (avg/min/max operands (mtx,rhs:r;lhs:rw) bandwidth lower bound 12.590/ 1.481/ 5.323,GBps) #pr: (avg/min/max code balance (bytes read at least once per flop) 1.495/ 0.650/ 2.599) #pr: (avg/min/max (avg) bytes per nnz after successful tuning were 2.080/ 2.080/ 2.080) #pr: (matrix has been subdivided more/less/same in resp. 0 / 4 /0 cases) #pr: (matrix has used more/less/same threads in resp. 0 / 0 /4 cases) #pr: no unsuccessful rsb autotuning attempt (according to 1.01x threshold) -#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.00 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.00 s, min 0.00 s, max 0.01 s, tot 0.02 s (4 samples) -#pr: best tun. rsb canon. mflops were: on avg. 2.103e+03, min 2.017e+03, max 2.244e+03 (4 samples) -#pr: ref. unt. rsb canon. mflops were: on avg. 1.242e+03, min 8.069e+02, max 1.686e+03 (4 samples) -#pr: best tun. rsb operation time was: on avg. 2.348e-05s, min 1.001e-05s, max 3.791e-05s, tot 9.394e-05s (4 samples) -#pr: ref. unt. rsb operation time was: on avg. 3.773e-05s, min 1.788e-05s, max 6.008e-05s, tot 1.509e-04s (4 samples) -#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 5.183e+00 1.962e+01 -#pr: in-cache to in-memory MEMSET bandwidth ratio: 1.755e+00 -#pr: Record collection took 0.25 s. +#pr: rsb auto tuning (either succ. or uns.) time was: on avg.: 0.53 s, min 0.52 s, max 0.54 s, tot 2.10 s (4 samples) +#pr: rsb auto tuning ( only successful ) time was: on avg.: 0.53 s, min 0.52 s, max 0.54 s, tot 2.10 s (4 samples) +#pr: best tun. rsb canon. mflops were: on avg. 2.116e+03, min 2.017e+03, max 2.244e+03 (4 samples) +#pr: ref. unt. rsb canon. mflops were: on avg. 2.625e+00, min 8.415e-01, max 5.029e+00 (4 samples) +#pr: best tun. rsb operation time was: on avg. 2.325e-05s, min 1.001e-05s, max 3.695e-05s, tot 9.298e-05s (4 samples) +#pr: ref. unt. rsb operation time was: on avg. 2.002e-02s, min 1.599e-02s, max 2.401e-02s, tot 8.006e-02s (4 samples) +#pr: min / max ratio of in-memory MEMSET bandwidth to extrapolated read bandwidth ratio: 2.455e+00 8.828e+00 +#pr: in-cache to in-memory MEMSET bandwidth ratio: 8.614e-01 +#pr: Record collection took 7.34 s. #pr: Record comprises 50 memory benchmark samples (prepend RSB_PR_MBW=1 to dump this). -#pr: Record comprises 99 environment variables in 4805 bytes (prepend RSB_PR_ENV=1 to dump this). +#pr: Record comprises 99 environment variables in 4859 bytes (prepend RSB_PR_ENV=1 to dump this). # ====== END Total summary record. #pr: ======== Saved a performance record of 4 samples to test.rpr # Removing the temporary record file test.rpr.tmp. -# terminating run at 1767573731 (after 9.1s of w.c.t.) +# terminating run at 1733165315 (after 20.7s of w.c.t.) + ls -ltr test-tuning-lower-100x100-5050nz--C-N-1--base.eps test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--D-N-1--base.eps test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--S-N-1--base.eps test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps test-tuning-lower-100x100-5050nz--Z-N-1--base.eps test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85629 Jan 4 12:42 test-tuning-lower-100x100-5050nz--D-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84552 Jan 4 12:42 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85630 Jan 4 12:42 test-tuning-lower-100x100-5050nz--S-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84552 Jan 4 12:42 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84552 Jan 4 12:42 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85630 Jan 4 12:42 test-tuning-lower-100x100-5050nz--C-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 85630 Jan 4 12:42 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps --rw-r--r-- 1 pbuilder1 pbuilder1 84552 Jan 4 12:42 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85638 Dec 3 08:48 test-tuning-lower-100x100-5050nz--D-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84560 Dec 3 08:48 test-tuning-lower-100x100-5050nz--D-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85638 Dec 3 08:48 test-tuning-lower-100x100-5050nz--S-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84560 Dec 3 08:48 test-tuning-lower-100x100-5050nz--S-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85638 Dec 3 08:48 test-tuning-lower-100x100-5050nz--C-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84560 Dec 3 08:48 test-tuning-lower-100x100-5050nz--C-N-1--mv-tuned_merge1_1x1th.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 85638 Dec 3 08:48 test-tuning-lower-100x100-5050nz--Z-N-1--base.eps +-rw-r--r-- 1 pbuilder2 pbuilder2 84559 Dec 3 08:48 test-tuning-lower-100x100-5050nz--Z-N-1--mv-tuned_merge1_1x1th.eps + rsbench --read-performance-record test.rpr + ls -ltr test.txt --rw-r--r-- 1 pbuilder1 pbuilder1 4082 Jan 4 12:42 test.txt +-rw-r--r-- 1 pbuilder2 pbuilder2 4099 Dec 3 08:48 test.txt + RSB_PR_WLTC=2 + RSB_PR_SR=0 + rsbench --read-performance-record test.rpr @@ -8145,29 +8186,29 @@ /usr/bin/kpsepath ++ kpsepath tex ++ sed 's/!!//g;s/:/\n/g;' -+ find . /nonexistent/first-build/.texlive2024/texmf-config/tex/kpsewhich// /nonexistent/first-build/.texlive2024/texmf-var/tex/kpsewhich// /nonexistent/first-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/first-build/.texlive2024/texmf-config/tex/generic// /nonexistent/first-build/.texlive2024/texmf-var/tex/generic// /nonexistent/first-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/first-build/.texlive2024/texmf-config/tex/latex// /nonexistent/first-build/.texlive2024/texmf-var/tex/latex// /nonexistent/first-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/first-build/.texlive2024/texmf-config/tex/// /nonexistent/first-build/.texlive2024/texmf-var/tex/// /nonexistent/first-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls -find: '/nonexistent/first-build/.texlive2024/texmf-config/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-var/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/kpsewhich//': No such file or directory ++ find . /nonexistent/second-build/.texlive2024/texmf-config/tex/kpsewhich// /nonexistent/second-build/.texlive2024/texmf-var/tex/kpsewhich// /nonexistent/second-build/texmf/tex/kpsewhich// /usr/local/share/texmf/tex/kpsewhich// /etc/texmf/tex/kpsewhich// /var/lib/texmf/tex/kpsewhich// /usr/share/texmf/tex/kpsewhich// /usr/share/texlive/texmf-dist/tex/kpsewhich// /nonexistent/second-build/.texlive2024/texmf-config/tex/generic// /nonexistent/second-build/.texlive2024/texmf-var/tex/generic// /nonexistent/second-build/texmf/tex/generic// /usr/local/share/texmf/tex/generic// /etc/texmf/tex/generic// /var/lib/texmf/tex/generic// /usr/share/texmf/tex/generic// /usr/share/texlive/texmf-dist/tex/generic// /nonexistent/second-build/.texlive2024/texmf-config/tex/latex// /nonexistent/second-build/.texlive2024/texmf-var/tex/latex// /nonexistent/second-build/texmf/tex/latex// /usr/local/share/texmf/tex/latex// /etc/texmf/tex/latex// /var/lib/texmf/tex/latex// /usr/share/texmf/tex/latex// /usr/share/texlive/texmf-dist/tex/latex// /nonexistent/second-build/.texlive2024/texmf-config/tex/// /nonexistent/second-build/.texlive2024/texmf-var/tex/// /nonexistent/second-build/texmf/tex/// /usr/local/share/texmf/tex/// /etc/texmf/tex/// /var/lib/texmf/tex/// /usr/share/texmf/tex/// /usr/share/texlive/texmf-dist/tex/// -name sciposter.cls +find: '/nonexistent/second-build/.texlive2024/texmf-config/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-var/tex/kpsewhich//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/kpsewhich//': No such file or directory find: '/usr/local/share/texmf/tex/kpsewhich//': No such file or directory find: '/etc/texmf/tex/kpsewhich//': No such file or directory find: '/var/lib/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texmf/tex/kpsewhich//': No such file or directory find: '/usr/share/texlive/texmf-dist/tex/kpsewhich//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-config/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-var/tex/generic//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-config/tex/generic//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-var/tex/generic//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/generic//': No such file or directory find: '/usr/local/share/texmf/tex/generic//': No such file or directory find: '/usr/share/texmf/tex/generic//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-config/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-var/tex/latex//': No such file or directory -find: '/nonexistent/first-build/texmf/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-config/tex/latex//': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-var/tex/latex//': No such file or directory +find: '/nonexistent/second-build/texmf/tex/latex//': No such file or directory find: '/usr/local/share/texmf/tex/latex//': No such file or directory find: '/etc/texmf/tex/latex//': No such file or directory find: '/var/lib/texmf/tex/latex//': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-config/tex///': No such file or directory -find: '/nonexistent/first-build/.texlive2024/texmf-var/tex///': No such file or directory -find: '/nonexistent/first-build/texmf/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-config/tex///': No such file or directory +find: '/nonexistent/second-build/.texlive2024/texmf-var/tex///': No such file or directory +find: '/nonexistent/second-build/texmf/tex///': No such file or directory find: '/usr/local/share/texmf/tex///': No such file or directory + exit 0 for mf in pd.mtx vf.mtx ; do if test -f /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; then true; else cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/$mf /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/$mf ; fi; done @@ -8182,7 +8223,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0x57881530]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0x56f90530]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -8197,7 +8238,7 @@ This error may be safely ignored. Correctly allocated a matrix. Summary information of the matrix: -(3 x 3)[0x58163530]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +(3 x 3)[0x584be530]{D} @ (0(0..3),0(0..3)) (3 nnz, 1 nnz/r) flags 0x2040384 (coo:1, csr:0, hw:0, ic:1, fi:0), storage: 40, subm: 1, symflags:'' Correctly performed a SPMV. Correctly freed the matrix. Correctly finalized the library. @@ -8261,51 +8302,51 @@ Done. Building a matrix with 5 nnz, 5 x 5 Duplicates check: 5 - 0 = 5 - converted COO to RSB in 4.697e-05 s (100.00 %) - analyzed arrays in 1.407e-05 s (29.95 %) - cleaned-up arrays in 1.192e-06 s (2.54 %) - deduplicated arrays in 0.000e+00 s (0.00 %) - sorted arrays in 6.914e-06 s (14.72 %) - shuffled partitions in 1.097e-05 s (23.35 %) - memory allocations took 4.768e-06 s (10.15 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 8.106e-06 s (17.26 %) -Built (5 x 5)[0x58164700]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' + converted COO to RSB in 1.586e-01 s (100.00 %) + analyzed arrays in 6.399e-02 s (40.34 %) + cleaned-up arrays in 9.537e-07 s (0.00 %) + deduplicated arrays in 1.192e-06 s (0.00 %) + sorted arrays in 1.464e-02 s (9.23 %) + shuffled partitions in 4.800e-02 s (30.26 %) + memory allocations took 6.914e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 3.200e-02 s (20.17 %) +Built (5 x 5)[0x584bf700]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' Allocated matrix of 5 nonzeroes: -(5 x 5)[0x58164700]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(5 x 5)[0x584bf700]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -Before auto-tuning, 100 multiplications took 0.000638s. +Before auto-tuning, 100 multiplications took 2.323970s. Threads autotuning (may take more than 1.500000s)... Will use autotuning routine to sample matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=5.12481e-08), 8 suggested as starting thread count(default). -3 iterations (8 th.) took 2.384e-05s; avg 7.947e-06s ( +/- 25.00/ 26.00 %); best 5.96e-06s; worst 1.001e-05s; std dev. 1.656e-06 (taking best). -Reference operation time is 5.96046e-06 s (3.355 Mflops) with 8 threads. -3 iterations (8 th.) took 1.788e-05s; avg 5.96e-06s ( +/- 16.00/ 16.00 %); best 5.007e-06s; worst 6.914e-06s; std dev. 7.787e-07 (taking best). -Reference operation time is 5.00679e-06 s (3.995 Mflops) with 8 threads. -After 0.000072s, autotuning routine did not find a better threads count configuration. -(5 x 5)[0x58164700]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' -After threads auto-tuning, 100 multiplications took 0.000575s -- effective speedup of 1.10945 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=5.35965e-08), 8 suggested as starting thread count(default). +3 iterations (8 th.) took 0.07195s; avg 0.02398s ( +/- 0.11/ 0.09 %); best 0.02396s; worst 0.02401s; std dev. 1.958e-05 (taking best). +Reference operation time is 0.0239589 s (0.0008348 Mflops) with 8 threads. +3 iterations (8 th.) took 0.07998s; avg 0.02666s ( +/- 10.06/ 19.97 %); best 0.02398s; worst 0.03199s; std dev. 0.003766 (taking best). +Reference operation time is 0.0239789 s (0.0008341 Mflops) with 8 threads. +After 0.152012s, autotuning routine did not find a better threads count configuration. +(5 x 5)[0x584bf700]{D} @ (0(0..0),0(0..0)) (5 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +After threads auto-tuning, 100 multiplications took 2.443983s -- effective speedup of 0.950895 x Matrix autotuning (may take more than 1.500000s; using 8 threads )... Will autotune matrix: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=5.12481e-08), 8 suggested as starting thread count. -3 iterations (8 th.) took 1.788e-05s; avg 5.96e-06s ( +/- 0.00/ 0.00 %); best 5.96e-06s; worst 5.96e-06s; std dev. 0 (taking best). -Reference operation time is 5.96046e-06 s (3.355 Mflops) with 8 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 5.96e-06 Mflops: 3.355) -Merge (2 -> 1 leaves) took w.c.t. of 6.914e-06s, ~9.537e-07s of computing time (of which 0s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 1.907e-06s; avg 6.358e-07s ( +/- 91.94/ 50.00 %); best 5.125e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 5.12481e-08 s (390.3 Mflops) with 8 threads. -After merge step 1: tpop: 5.125e-08 s ~Mflops: 390.259 nsubm:1 otn:8 -Applying merge (2 -> 1 leaves, 8 th.) yielded SPEEDUP of 116.306x: 5.96e-06s -> 5.125e-08s, so taking this instance. +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=5.35965e-08), 8 suggested as starting thread count. +3 iterations (8 th.) took 0.07199s; avg 0.024s ( +/- 33.26/ 33.20 %); best 0.01602s; worst 0.03196s; std dev. 0.006511 (taking best). +Reference operation time is 0.0160151 s (0.001249 Mflops) with 8 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 5 x 5, type D, 5 nnz, 1 nnz/r, 3 subms, 2 lsubms, 4.0000 bpnz (tpop: 0.01602 Mflops: 0.001) +Merge (2 -> 1 leaves) took w.c.t. of 1.884e-05s, ~3.099e-06s of computing time (of which 0s sorting, 5.007e-06s analysis) +3 iterations (8 th.) took 2.146e-06s; avg 7.153e-07s ( +/- 92.51/200.00 %); best 5.36e-08s; worst 2.146e-06s; std dev. 1.012e-06 (taking best). +Reference operation time is 5.35965e-08 s (373.2 Mflops) with 8 threads. +After merge step 1: tpop: 5.36e-08 s ~Mflops: 373.159 nsubm:1 otn:8 +Applying merge (2 -> 1 leaves, 8 th.) yielded SPEEDUP of 298807.829x: 0.01602s -> 5.36e-08s, so taking this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.0001562s (of which 7.415e-05s partitioning, 0s I/O); computing times: 9.537e-07s in par. loops, 0s sorting, 9.537e-07s analyzing) -Total merge + benchmarking process took 0.0001562s, equivalent to 3047.2/26.2 new/old ops (9.012e-05s for 2 clones -- as 1758.5/15.1 ops, or 879.3/7.6 ops per clone), SPEEDUP of 116.306x -Applying multi-merge (2 -> 1 leaves, 1 steps, 8 -> 8 th.sp.) yielded SPEEDUP of 116.306x (5.96e-06s -> 5.125e-08s), will amortize in 26.4 ops by saving 5.909e-06s per op. -In 1 tuning rounds (tot. 0.00021s, 9e-05s for constructor, 2 clones) obtained a SPEEDUP of 11530.6% (116.3x) (from 3.355 to 390.3 Mflops). -After 0.000217s, autotuning routine declared speedup of 116.306 x, when using threads count of 8. -(5 x 5)[0x581666a0]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' -After threads auto-tuning, 100 multiplications took 0.000012s -- further speedup of 48.24 x +A total of 1 merge steps (of max 6) (2 -> 1 subms) took 0.07597s (of which 3.91e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 0s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.07597s, equivalent to 1417535.6/4.7 new/old ops (0.1479s for 2 clones -- as 2759248.2/9.2 ops, or 1379624.1/4.6 ops per clone), SPEEDUP of 298807.829x +Applying multi-merge (2 -> 1 leaves, 1 steps, 8 -> 8 th.sp.) yielded SPEEDUP of 298807.829x (0.01602s -> 5.36e-08s), will amortize in 4.7 ops by saving 0.01601s per op. +In 1 tuning rounds (tot. 0.22s, 0.15s for constructor, 2 clones) obtained a SPEEDUP of 29880682.9% (2.988e+05x) (from 0.001249 to 373.2 Mflops). +After 0.219997s, autotuning routine declared speedup of 298808 x, when using threads count of 8. +(5 x 5)[0x584c16a0]{D} @ (0(0..5),0(0..5)) (5 nnz, 1 nnz/r) flags 0x2040186 (coo:1, csr:0, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'' +After threads auto-tuning, 100 multiplications took 0.000018s -- further speedup of 136677 x 0/2 0 0 -> 0 1/2 1 0 -> 5 0/2 0 3 -> 0 @@ -8316,7 +8357,7 @@ Correctly initialized the library. Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0x58164700]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0x584bf700]{D} @ (0(1..2),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -8470,75 +8511,75 @@ Creating 500 x 500 matrix with 62500 nonzeroes. Building a matrix with 62500 nnz, 500 x 500 Duplicates check: 62500 - 0 = 62500 - converted COO to RSB in 2.051e-03 s (100.00 %) - analyzed arrays in 8.893e-05 s (4.34 %) - cleaned-up arrays in 8.392e-05 s (4.09 %) - deduplicated arrays in 7.200e-05 s (3.51 %) - sorted arrays in 1.494e-03 s (72.84 %) - shuffled partitions in 2.491e-04 s (12.15 %) - memory allocations took 1.931e-05 s (0.94 %) - leafs setup took 3.815e-06 s (0.19 %) - halfword conversion took 3.719e-05 s (1.81 %) -Built (500 x 500)[0x5732a360]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + converted COO to RSB in 3.387e-01 s (100.00 %) + analyzed arrays in 5.184e-02 s (15.30 %) + cleaned-up arrays in 7.820e-05 s (0.02 %) + deduplicated arrays in 7.010e-05 s (0.02 %) + sorted arrays in 1.507e-01 s (44.49 %) + shuffled partitions in 9.999e-02 s (29.52 %) + memory allocations took 2.980e-05 s (0.01 %) + leafs setup took 9.060e-06 s (0.00 %) + halfword conversion took 3.599e-02 s (10.63 %) +Built (500 x 500)[0x56ff3360]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Allocated matrix of 62500 nonzeroes: -(500 x 500)[0x5732a360]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(500 x 500)[0x56ff3360]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' -Before auto-tuning, 100 multiplications took 0.010511s. +Before auto-tuning, 100 multiplications took 2.443811s. Threads autotuning (may take more than 1.500000s)... -Will use autotuning routine to sample matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 31 subms, 22 lsubms, 2.0695 bpnz. +Will use autotuning routine to sample matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 31 subms, 22 lsubms, 2.0735 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=5.31077e-08), 8 suggested as starting thread count(default). -3 iterations (8 th.) took 0.0003021s; avg 0.0001007s ( +/- 2.68/ 2.29 %); best 9.799e-05s; worst 0.000103s; std dev. 2.063e-06 (taking best). -Reference operation time is 9.799e-05 s (2551 Mflops) with 8 threads. -3 iterations (8 th.) took 0.000303s; avg 0.000101s ( +/- 1.81/ 1.97 %); best 9.918e-05s; worst 0.000103s; std dev. 1.561e-06 (taking best). -Reference operation time is 9.91821e-05 s (2521 Mflops) with 8 threads. -After 0.000646s, autotuning routine did not find a better threads count configuration. -(500 x 500)[0x5732a360]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' -After threads auto-tuning, 100 multiplications took 0.010385s -- effective speedup of 1.01214 x +Sampling (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=5.86033e-08), 8 suggested as starting thread count(default). +3 iterations (8 th.) took 0.07193s; avg 0.02398s ( +/- 33.21/ 33.19 %); best 0.01601s; worst 0.03193s; std dev. 0.0065 (taking best). +Reference operation time is 0.0160129 s (15.61 Mflops) with 8 threads. +3 iterations (8 th.) took 0.08799s; avg 0.02933s ( +/- 15.51/ 9.13 %); best 0.02478s; worst 0.03201s; std dev. 0.003233 (taking best). +Reference operation time is 0.024781 s (10.09 Mflops) with 8 threads. +After 0.160009s, autotuning routine did not find a better threads count configuration. +(500 x 500)[0x56ff3360]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +After threads auto-tuning, 100 multiplications took 2.331960s -- effective speedup of 1.04796 x Matrix autotuning (may take more than 1.500000s; using 8 threads )... -Will autotune matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 31 subms, 22 lsubms, 2.0695 bpnz. +Will autotune matrix: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 31 subms, 22 lsubms, 2.0735 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=5.31077e-08), 8 suggested as starting thread count. -3 iterations (8 th.) took 0.0003259s; avg 0.0001086s ( +/- 6.95/ 8.63 %); best 0.0001011s; worst 0.000118s; std dev. 7.031e-06 (taking best). -Reference operation time is 0.000101089 s (2473 Mflops) with 8 threads. -Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 31 subms, 22 lsubms, 2.0695 bpnz (tpop: 0.0001011 Mflops: 2473.057) -Merge (22 -> 19 leaves) took w.c.t. of 6.08e-05s, ~4.697e-05s of computing time (of which 2.098e-05s sorting, 2.861e-06s analysis) -3 iterations (8 th.) took 0.0003021s; avg 0.0001007s ( +/- 0.55/ 0.39 %); best 0.0001001s; worst 0.0001011s; std dev. 4.052e-07 (taking best). -Reference operation time is 0.000100136 s (2497 Mflops) with 8 threads. -After merge step 1: tpop: 0.0001001 s ~Mflops: 2496.610 nsubm:19 otn:8 -Applying merge (22 -> 19 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00952x): 0.0001011s -> 0.0001001s, so IGNORING this instance. -Merge (19 -> 16 leaves) took w.c.t. of 5.198e-05s, ~4.387e-05s of computing time (of which 2.623e-05s sorting, 2.146e-06s analysis) -3 iterations (8 th.) took 0.0003018s; avg 0.0001006s ( +/- 0.71/ 0.47 %); best 9.99e-05s; worst 0.0001011s; std dev. 5.15e-07 (taking best). -Reference operation time is 9.98974e-05 s (2503 Mflops) with 8 threads. -After merge step 2: tpop: 9.99e-05 s ~Mflops: 2502.568 nsubm:16 otn:8 -Applying merge (19 -> 16 leaves, 8 th.) yielded SPEEDUP of 1.012x: 0.0001011s -> 9.99e-05s, so taking this instance. -Merge (16 -> 13 leaves) took w.c.t. of 4.721e-05s, ~4.101e-05s of computing time (of which 2.098e-05s sorting, 2.146e-06s analysis) -3 iterations (8 th.) took 0.0003171s; avg 0.0001057s ( +/- 5.49/ 9.85 %); best 9.99e-05s; worst 0.0001161s; std dev. 7.378e-06 (taking best). -Reference operation time is 9.98974e-05 s (2503 Mflops) with 8 threads. -After merge step 3: tpop: 9.99e-05 s ~Mflops: 2502.568 nsubm:13 otn:8 -Applying merge (16 -> 13 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 9.99e-05s -> 9.99e-05s, so IGNORING this instance. -Merge (13 -> 10 leaves) took w.c.t. of 0.000196s, ~0.0001888s of computing time (of which 0.0001371s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 0.0003219s; avg 0.0001073s ( +/- 2.22/ 1.78 %); best 0.0001049s; worst 0.0001092s; std dev. 1.784e-06 (taking best). -Reference operation time is 0.000104904 s (2383 Mflops) with 8 threads. -After merge step 4: tpop: 0.0001049 s ~Mflops: 2383.127 nsubm:10 otn:8 -Applying merge (13 -> 10 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.050x: 9.99e-05s -> 0.0001049s. -Merge (10 -> 7 leaves) took w.c.t. of 0.000144s, ~0.000139s of computing time (of which 9.203e-05s sorting, 1.192e-06s analysis) -3 iterations (8 th.) took 0.0003119s; avg 0.000104s ( +/- 2.06/ 2.06 %); best 0.0001018s; worst 0.0001061s; std dev. 1.752e-06 (taking best). -Reference operation time is 0.000101805 s (2456 Mflops) with 8 threads. -After merge step 5: tpop: 0.0001018 s ~Mflops: 2455.681 nsubm:7 otn:8 -Applying merge (10 -> 7 leaves, 8 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=0.98126x): 9.99e-05s -> 0.0001018s, so IGNORING this instance. -Merge (7 -> 4 leaves) took w.c.t. of 0.000155s, ~0.000149s of computing time (of which 0.000103s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 0.000335s; avg 0.0001117s ( +/- 6.90/ 11.89 %); best 0.000104s; worst 0.0001249s; std dev. 9.425e-06 (taking best). -Reference operation time is 0.000103951 s (2405 Mflops) with 8 threads. -After merge step 6: tpop: 0.000104 s ~Mflops: 2404.991 nsubm:4 otn:8 -Applying merge (7 -> 4 leaves, 8 th.) yielded SLOWDOWN (2th of 3 tolerable) of 1.041x: 9.99e-05s -> 0.000104s. -A total of 6 merge steps (of max 6) (22 -> 4 subms) took 0.00301s (of which 0.0007472s partitioning, 0s I/O); computing times: 0.0006087s in par. loops, 0.0004003s sorting, 1.025e-05s analyzing) -Total merge + benchmarking process took 0.00301s, equivalent to 30.1/29.8 new/old ops (0.0006459s for 2 clones -- as 6.5/6.4 ops, or 3.2/3.2 ops per clone), SPEEDUP of 1.012x -Applying multi-merge (22 -> 16 leaves, 2 steps, 8 -> 8 th.sp.) yielded SPEEDUP of 1.012x (0.0001011s -> 9.99e-05s), will amortize in 2525.0 ops by saving 1.192e-06s per op. -In 1 tuning rounds (tot. 0.0038s, 0.00065s for constructor, 2 clones) obtained a SPEEDUP of 1.2% (1.012x) (from 2473 to 2503 Mflops). -After 0.003837s, autotuning routine declared speedup of 1.01193 x, when using threads count of 8. -(500 x 500)[0x5732da90]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' -After threads auto-tuning, 100 multiplications took 0.010340s -- further speedup of 1.00436 x +Starting autotuning (15 x 0.1 s stages, transA=N, nrhs=2, timer gran.=5.86033e-08), 8 suggested as starting thread count. +3 iterations (8 th.) took 0.07994s; avg 0.02665s ( +/- 9.95/ 5.09 %); best 0.024s; worst 0.028s; std dev. 0.001875 (taking best). +Reference operation time is 0.0239952 s (10.42 Mflops) with 8 threads. +Starting merge (user-supplied threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 500 x 500, type D, 62500 nnz, 1.2e+02 nnz/r, 31 subms, 22 lsubms, 2.0735 bpnz (tpop: 0.024 Mflops: 10.419) +Merge (22 -> 16 leaves) took w.c.t. of 0.03598s, ~0.01212s of computing time (of which 4.101e-05s sorting, 5.96e-06s analysis) +3 iterations (8 th.) took 0.08797s; avg 0.02932s ( +/- 45.40/ 36.30 %); best 0.01601s; worst 0.03997s; std dev. 0.009961 (taking best). +Reference operation time is 0.016011 s (15.61 Mflops) with 8 threads. +After merge step 1: tpop: 0.01601 s ~Mflops: 15.614 nsubm:16 otn:8 +Applying merge (22 -> 16 leaves, 8 th.) yielded SPEEDUP of 1.499x: 0.024s -> 0.01601s, so taking this instance. +Merge (16 -> 10 leaves) took w.c.t. of 0.0161s, ~0.008232s of computing time (of which 0.008118s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 0.09587s; avg 0.03196s ( +/- 49.96/ 49.81 %); best 0.01599s; worst 0.04787s; std dev. 0.01302 (taking best). +Reference operation time is 0.0159891 s (15.64 Mflops) with 8 threads. +After merge step 2: tpop: 0.01599 s ~Mflops: 15.636 nsubm:10 otn:8 +Applying merge (16 -> 10 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00137x): 0.01601s -> 0.01599s, so IGNORING this instance. +Merge (10 -> 7 leaves) took w.c.t. of 0.000103s, ~8.488e-05s of computing time (of which 4.911e-05s sorting, 5.007e-06s analysis) +3 iterations (8 th.) took 0.06387s; avg 0.02129s ( +/- 25.46/ 50.20 %); best 0.01587s; worst 0.03198s; std dev. 0.007558 (taking best). +Reference operation time is 0.0158699 s (15.75 Mflops) with 8 threads. +After merge step 3: tpop: 0.01587 s ~Mflops: 15.753 nsubm:7 otn:8 +Applying merge (10 -> 7 leaves, 8 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00889x): 0.01601s -> 0.01587s, so IGNORING this instance. +Merge (7 -> 4 leaves) took w.c.t. of 0.000123s, ~0.000109s of computing time (of which 6.199e-05s sorting, 5.007e-06s analysis) +3 iterations (8 th.) took 0.06385s; avg 0.02128s ( +/- 25.58/ 50.26 %); best 0.01584s; worst 0.03198s; std dev. 0.007564 (taking best). +Reference operation time is 0.0158391 s (15.78 Mflops) with 8 threads. +After merge step 4: tpop: 0.01584 s ~Mflops: 15.784 nsubm:4 otn:8 +Applying merge (7 -> 4 leaves, 8 th.) yielded SPEEDUP of 1.011x: 0.01601s -> 0.01584s, so taking this instance. +Merge (4 -> 3 leaves) took w.c.t. of 9.394e-05s, ~7.987e-05s of computing time (of which 0s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 0.0639s; avg 0.0213s ( +/- 25.35/ 50.19 %); best 0.0159s; worst 0.03199s; std dev. 0.007559 (taking best). +Reference operation time is 0.0158992 s (15.72 Mflops) with 8 threads. +After merge step 5: tpop: 0.0159 s ~Mflops: 15.724 nsubm:3 otn:8 +Applying merge (4 -> 3 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99622x): 0.01584s -> 0.0159s, so IGNORING this instance. +Merge (3 -> 2 leaves) took w.c.t. of 7.987e-05s, ~6.294e-05s of computing time (of which 0s sorting, 5.007e-06s analysis) +3 iterations (8 th.) took 0.04791s; avg 0.01597s ( +/- 0.48/ 0.31 %); best 0.01589s; worst 0.01602s; std dev. 5.527e-05 (taking best). +Reference operation time is 0.015892 s (15.73 Mflops) with 8 threads. +After merge step 6: tpop: 0.01589 s ~Mflops: 15.731 nsubm:2 otn:8 +Applying merge (3 -> 2 leaves, 8 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=0.99667x): 0.01584s -> 0.01589s, so IGNORING this instance. +A total of 6 merge steps (of max 6) (22 -> 2 subms) took 0.604s (of which 0.05252s partitioning, 0s I/O); computing times: 0.02069s in par. loops, 0.00827s sorting, 2.909e-05s analyzing) +Total merge + benchmarking process took 0.604s, equivalent to 38.1/25.2 new/old ops (0.192s for 3 clones -- as 12.1/8.0 ops, or 4.0/2.7 ops per clone), SPEEDUP of 1.515x +Applying multi-merge (22 -> 4 leaves, 4 steps, 8 -> 8 th.sp.) yielded SPEEDUP of 1.515x (0.024s -> 0.01584s), will amortize in 74.1 ops by saving 0.008156s per op. +In 1 tuning rounds (tot. 0.75s, 0.19s for constructor, 3 clones) obtained a SPEEDUP of 51.5% (1.515x) (from 10.42 to 15.78 Mflops). +After 0.748142s, autotuning routine declared speedup of 1.51493 x, when using threads count of 8. +(500 x 500)[0x570ed630]{D} @ (0(0..0),0(0..0)) (62500 nnz, 1.2e+02 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 4, symflags:'' +After threads auto-tuning, 100 multiplications took 2.083841s -- further speedup of 1.11907 x librsb timer-based profiling is not supported in this build. If you wish to have it, re-configure librsb with its support. So you can safely ignore the error you might just have seen printed out on screen. /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/backsolve Hello, RSB! @@ -8546,19 +8587,19 @@ Correctly initialized the library. Building a matrix with 7 nnz, 6 x 6 Duplicates check: 1 - 0 = 1 - converted COO to RSB in 3.829e-04 s (100.00 %) - analyzed arrays in 3.469e-04 s (90.60 %) - cleaned-up arrays in 7.868e-06 s (2.05 %) - deduplicated arrays in 1.192e-06 s (0.31 %) - sorted arrays in 9.537e-07 s (0.25 %) - shuffled partitions in 9.060e-06 s (2.37 %) - memory allocations took 1.025e-05 s (2.68 %) - leafs setup took 9.537e-07 s (0.25 %) - halfword conversion took 3.815e-06 s (1.00 %) -Built (6 x 6)[0x582bb540]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' + converted COO to RSB in 1.168e-01 s (100.00 %) + analyzed arrays in 8.076e-02 s (69.15 %) + cleaned-up arrays in 6.914e-06 s (0.01 %) + deduplicated arrays in 0.000e+00 s (0.00 %) + sorted arrays in 1.192e-06 s (0.00 %) + shuffled partitions in 3.600e-02 s (30.82 %) + memory allocations took 1.383e-05 s (0.01 %) + leafs setup took 8.106e-06 s (0.01 %) + halfword conversion took 8.821e-06 s (0.01 %) +Built (6 x 6)[0x583bd540]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Correctly allocated a matrix with 7 nonzeroes. Summary information of the matrix: -(6 x 6)[0x582bb540]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' +(6 x 6)[0x583bd540]{D} @ (0(0..1),0(5..6)) (1 nnz, 0.17 nnz/r) flags 0x20443ee (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 1, symflags:'UT' Matrix printout: %%MatrixMarket matrix coordinate real general 6 6 1 @@ -8584,55 +8625,55 @@ 1 1 Will autotune matrix: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:5.035e-08 -3 iterations (8 th.) took 1.693e-05s; avg 5.643e-06s ( +/- 99.11/183.10 %); best 5.035e-08s; worst 1.597e-05s; std dev. 7.316e-06 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 5.035e-08 Mflops: 39.719) +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:5.33e-08 +3 iterations (8 th.) took 3.219e-05s; avg 1.073e-05s ( +/- 99.50/200.00 %); best 5.33e-08s; worst 3.219e-05s; std dev. 1.517e-05 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 5.33e-08 Mflops: 37.525) Merge (1 -> 1 leaves) took w.c.t. of 0s, ~0s of computing time (of which 0s sorting, 0s analysis) -3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 84.16/200.00 %); best 5.035e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -After merge step 1: tpop: 5.035e-08 s ~Mflops: 39.719 nsubm:1 otn:8 -Applying merge (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 5.035e-08s -> 5.035e-08s, so IGNORING this instance. +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 83.23/200.00 %); best 5.33e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +After merge step 1: tpop: 5.33e-08 s ~Mflops: 37.525 nsubm:1 otn:8 +Applying merge (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 5.33e-08s -> 5.33e-08s, so IGNORING this instance. Merged all the matrix leaves: no reason to continue merging. -A total of 1 merge steps (of max 6) (1 -> 1 subms) took 1.001e-05s (of which 2.146e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) -Total merge + benchmarking process took 1.001e-05s, equivalent to 198.9/198.9 new/old ops (1.717e-05s for 1 clones -- as 340.9/340.9 ops, or 340.9/340.9 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +A total of 1 merge steps (of max 6) (1 -> 1 subms) took 1.287e-05s (of which 4.053e-06s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 0s analyzing) +Total merge + benchmarking process took 1.287e-05s, equivalent to 241.6/241.6 new/old ops (0.06385s for 1 clones -- as 1197915.5/1197915.5 ops, or 1197915.5/1197915.5 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (8 th.) took 0s; avg 0s ( +/- -inf/ -nan %); best 5.035e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 5.035e-08 Mflops: 39.719) -Split (1 -> 1 leaves, 1 -> 1 subms) took 8.821e-06s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 84.16/200.00 %); best 5.035e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -After split step 1: tpop: 5.035e-08 s ~Mflops: 39.719 nsubm:1 otn:8 -Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 5.035e-08s -> 5.035e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 4.053e-06s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (8 th.) took 0s; avg 0s ( +/- -inf/ -nan %); best 5.035e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -After split step 2: tpop: 5.035e-08 s ~Mflops: 39.719 nsubm:1 otn:8 -Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00000x): 5.035e-08s -> 5.035e-08s, so IGNORING this instance. +3 iterations (8 th.) took 8.106e-06s; avg 2.702e-06s ( +/- 98.03/200.00 %); best 5.33e-08s; worst 8.106e-06s; std dev. 3.821e-06 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 1 nnz, 0.17 nnz/r, 1 subms, 1 lsubms, 4.0000 bpnz (tpop: 5.33e-08 Mflops: 37.525) +Split (1 -> 1 leaves, 1 -> 1 subms) took 2.098e-05s (of which: 4.053e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 83.23/200.00 %); best 5.33e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +After split step 1: tpop: 5.33e-08 s ~Mflops: 37.525 nsubm:1 otn:8 +Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 5.33e-08s -> 5.33e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 4.768e-06s (of which: 9.537e-07s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 83.23/200.00 %); best 5.33e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +After split step 2: tpop: 5.33e-08 s ~Mflops: 37.525 nsubm:1 otn:8 +Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00000x): 5.33e-08s -> 5.33e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 5.007e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 83.23/200.00 %); best 5.33e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +After split step 3: tpop: 5.33e-08 s ~Mflops: 37.525 nsubm:1 otn:8 +Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=1.00000x): 5.33e-08s -> 5.33e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 5.007e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 0s; avg 0s ( +/- -inf/ -nan %); best 5.33e-08s; worst 0s; std dev. 0 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +After split step 4: tpop: 5.33e-08 s ~Mflops: 37.525 nsubm:1 otn:8 +Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00000x): 5.33e-08s -> 5.33e-08s, so IGNORING this instance. +Split (1 -> 1 leaves, 1 -> 1 subms) took 4.053e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 83.23/200.00 %); best 5.33e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +After split step 5: tpop: 5.33e-08 s ~Mflops: 37.525 nsubm:1 otn:8 +Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00000x): 5.33e-08s -> 5.33e-08s, so IGNORING this instance. Split (1 -> 1 leaves, 1 -> 1 subms) took 3.815e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 84.16/200.00 %); best 5.035e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -After split step 3: tpop: 5.035e-08 s ~Mflops: 39.719 nsubm:1 otn:8 -Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=1.00000x): 5.035e-08s -> 5.035e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 2.861e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (8 th.) took 0s; avg 0s ( +/- -inf/ -nan %); best 5.035e-08s; worst 0s; std dev. 0 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -After split step 4: tpop: 5.035e-08 s ~Mflops: 39.719 nsubm:1 otn:8 -Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00000x): 5.035e-08s -> 5.035e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 3.099e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 84.16/200.00 %); best 5.035e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -After split step 5: tpop: 5.035e-08 s ~Mflops: 39.719 nsubm:1 otn:8 -Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00000x): 5.035e-08s -> 5.035e-08s, so IGNORING this instance. -Split (1 -> 1 leaves, 1 -> 1 subms) took 3.099e-06s (of which: 0s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. -3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 84.16/200.00 %); best 5.035e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). -Reference operation time is 5.0354e-08 s (39.72 Mflops) with 8 threads. -After split step 6: tpop: 5.035e-08 s ~Mflops: 39.719 nsubm:1 otn:8 -Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00000x): 5.035e-08s -> 5.035e-08s, so IGNORING this instance. -A total of 6 split steps (of max 6) (1 -> 1 subms) took 7.415e-05s (of which 3.6e-05s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 1.907e-06s analyzing) -Total split + benchmarking process took 7.415e-05s, equivalent to 1472.5/1472.5 new/old ops (1.407e-05s for 1 clones -- as 279.4/279.4 ops, or 279.4/279.4 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) -In 1 tuning rounds (tot. 0.00016s, 3.1e-05s for constructor, 2 clones) obtained NO speedup (best stays 39.72 Mflops). +3 iterations (8 th.) took 9.537e-07s; avg 3.179e-07s ( +/- 83.23/200.00 %); best 5.33e-08s; worst 9.537e-07s; std dev. 4.496e-07 (taking best). +Reference operation time is 5.32985e-08 s (37.52 Mflops) with 8 threads. +After split step 6: tpop: 5.33e-08 s ~Mflops: 37.525 nsubm:1 otn:8 +Applying split (1 -> 1 leaves, 8 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00000x): 5.33e-08s -> 5.33e-08s, so IGNORING this instance. +A total of 6 split steps (of max 6) (1 -> 1 subms) took 0.0001221s (of which 6.7e-05s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 5.007e-06s analyzing) +Total split + benchmarking process took 0.0001221s, equivalent to 2290.3/2290.3 new/old ops (0.08125s for 1 clones -- as 1524486.7/1524486.7 ops, or 1524486.7/1524486.7 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.15s, 0.15s for constructor, 2 clones) obtained NO speedup (best stays 37.52 Mflops). Backsolving we should get a unitary vector: %%MatrixMarket matrix array real general @@ -8667,117 +8708,217 @@ /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran Building a matrix with 210 nnz, 20 x 20 Duplicates check: 210 - 0 = 210 - converted COO to RSB in 4.630e-04 s (100.00 %) - analyzed arrays in 5.984e-05 s (12.92 %) - cleaned-up arrays in 5.960e-06 s (1.29 %) - deduplicated arrays in 9.537e-07 s (0.21 %) - sorted arrays in 3.021e-04 s (65.24 %) - shuffled partitions in 4.220e-05 s (9.11 %) - memory allocations took 2.098e-05 s (4.53 %) - leafs setup took 5.007e-06 s (1.08 %) - halfword conversion took 1.884e-05 s (4.07 %) -Built (20 x 20)[0x5745f440]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 23, symflags:'LS' -Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 32 subms, 23 lsubms, 3.7524 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:5.18e-08 -Starting autotuning (16 x 5.17964e-08 s stages, transA=N, nrhs=1, timer gran.=5.17964e-08), 8 suggested as starting thread count(default). -3 iterations (8 th.) took 0.000721s; avg 0.0002403s ( +/- 53.37/ 26.88 %); best 0.0001121s; worst 0.0003049s; std dev. 9.07e-05 (taking best). -Reference operation time is 0.000112057 s (7.496 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 32 subms, 23 lsubms, 3.7524 bpnz (tpop: 0.0001121 Mflops: 7.496) -Merge (23 -> 19 leaves) took w.c.t. of 0.0001829s, ~0.00033s of computing time (of which 1.907e-06s sorting, 2.861e-06s analysis) -3 iterations (8 th.) took 0.0006499s; avg 0.0002166s ( +/- 68.64/102.16 %); best 6.795e-05s; worst 0.000438s; std dev. 0.0001596 (taking best). -Reference operation time is 6.79493e-05 s (12.36 Mflops) with 8 threads. -After merge step 1: tpop: 6.795e-05 s ~Mflops: 12.362 nsubm:19 otn:8 -Applying merge (23 -> 19 leaves, 8 th.) yielded SPEEDUP of 1.649x: 0.0001121s -> 6.795e-05s, so taking this instance. -Merge (19 -> 13 leaves) took w.c.t. of 2.313e-05s, ~8.106e-06s of computing time (of which 1.907e-06s sorting, 2.146e-06s analysis) -3 iterations (8 th.) took 0.000622s; avg 0.0002073s ( +/- 66.19/113.65 %); best 7.01e-05s; worst 0.000443s; std dev. 0.0001674 (taking best). -Reference operation time is 7.00951e-05 s (11.98 Mflops) with 8 threads. -After merge step 2: tpop: 7.01e-05 s ~Mflops: 11.984 nsubm:13 otn:8 -Applying merge (19 -> 13 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.032x: 6.795e-05s -> 7.01e-05s. -Merge (13 -> 10 leaves) took w.c.t. of 1.097e-05s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) -3 iterations (8 th.) took 0.000217s; avg 7.232e-05s ( +/- 36.37/ 31.54 %); best 4.601e-05s; worst 9.513e-05s; std dev. 2.02e-05 (taking best). -Reference operation time is 4.60148e-05 s (18.26 Mflops) with 8 threads. -After merge step 3: tpop: 4.601e-05 s ~Mflops: 18.255 nsubm:10 otn:8 -Applying merge (13 -> 10 leaves, 8 th.) yielded SPEEDUP of 1.477x: 6.795e-05s -> 4.601e-05s, so taking this instance. -Merge (10 -> 8 leaves) took w.c.t. of 8.821e-06s, ~3.099e-06s of computing time (of which 2.146e-06s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 0.000495s; avg 0.000165s ( +/- 52.75/104.91 %); best 7.796e-05s; worst 0.0003381s; std dev. 0.0001224 (taking best). -Reference operation time is 7.79629e-05 s (10.77 Mflops) with 8 threads. -After merge step 4: tpop: 7.796e-05 s ~Mflops: 10.774 nsubm:8 otn:8 -Applying merge (10 -> 8 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.694x: 4.601e-05s -> 7.796e-05s. + converted COO to RSB in 1.846e-01 s (100.00 %) + analyzed arrays in 4.797e-02 s (25.98 %) + cleaned-up arrays in 5.007e-06 s (0.00 %) + deduplicated arrays in 1.907e-06 s (0.00 %) + sorted arrays in 4.062e-02 s (22.00 %) + shuffled partitions in 4.800e-02 s (26.00 %) + memory allocations took 2.503e-05 s (0.01 %) + leafs setup took 7.153e-06 s (0.00 %) + halfword conversion took 4.800e-02 s (26.00 %) +Built (20 x 20)[0x57258440]{D} @ (0(0..0),0(0..0)) (210 nnz, 10 nnz/r) flags 0x2446396 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 23, symflags:'LS' +Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 31 subms, 23 lsubms, 3.7714 bpnz. +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:5.366e-08 +Starting autotuning (16 x 5.36561e-08 s stages, transA=N, nrhs=1, timer gran.=5.36561e-08), 8 suggested as starting thread count(default). +3 iterations (8 th.) took 0.064s; avg 0.02133s ( +/- 25.02/ 50.02 %); best 0.016s; worst 0.03201s; std dev. 0.007545 (taking best). +Reference operation time is 0.015996 s (0.05251 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 31 subms, 23 lsubms, 3.7714 bpnz (tpop: 0.016 Mflops: 0.053) +Merge (23 -> 17 leaves) took w.c.t. of 0.02797s, ~0.008069s of computing time (of which 3.815e-06s sorting, 9.06e-06s analysis) +3 iterations (8 th.) took 0.116s; avg 0.03866s ( +/- 48.27/ 44.81 %); best 0.02s; worst 0.05598s; std dev. 0.01472 (taking best). +Reference operation time is 0.02 s (0.042 Mflops) with 8 threads. +After merge step 1: tpop: 0.02 s ~Mflops: 0.042 nsubm:17 otn:8 +Applying merge (23 -> 17 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.250x: 0.016s -> 0.02s. Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 4 merge steps (of max 6) (23 -> 8 subms) took 0.002299s (of which 0.0002348s partitioning, 0s I/O); computing times: 0.0003452s in par. loops, 6.914e-06s sorting, 7.868e-06s analyzing) -Total merge + benchmarking process took 0.002299s, equivalent to 50.0/20.5 new/old ops (8.178e-05s for 3 clones -- as 1.8/0.7 ops, or 0.6/0.2 ops per clone), SPEEDUP of 2.435x -Applying multi-merge (23 -> 10 leaves, 3 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 2.435x (0.0001121s -> 4.601e-05s), will amortize in 34.8 ops by saving 6.604e-05s per op. -In 1 tuning rounds (tot. 0.0031s, 8.2e-05s for constructor, 3 clones) obtained a SPEEDUP of 143.5% (2.435x) (from 7.496 to 18.26 Mflops). +A total of 1 merge steps (of max 6) (23 -> 17 subms) took 0.144s (of which 0.02798s partitioning, 0s I/O); computing times: 0.008069s in par. loops, 3.815e-06s sorting, 9.06e-06s analyzing) +Total merge + benchmarking process took 0.144s, equivalent to 9.0/9.0 new/old ops (0.07991s for 1 clones -- as 5.0/5.0 ops, or 5.0/5.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (8 th.) took 0.08s; avg 0.02667s ( +/- 40.00/ 20.01 %); best 0.016s; worst 0.032s; std dev. 0.007543 (taking best). +Reference operation time is 0.0159998 s (0.0525 Mflops) with 8 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 31 subms, 23 lsubms, 3.7714 bpnz (tpop: 0.016 Mflops: 0.053) +Split (23 -> 53 leaves, 31 -> 72 subms) took 0.03196s (of which: 5.007e-06s analysis, -1.906e+10s mem.mgmt); compute time: 0.0003436s overall, 5.007e-06s searches, 0.0003386s shuffle, 0.0001476s switch, 6.509e-05s quadrants. +3 iterations (8 th.) took 0.06397s; avg 0.02132s ( +/- 25.09/ 50.05 %); best 0.01597s; worst 0.032s; std dev. 0.007546 (taking best). +Reference operation time is 0.0159731 s (0.05259 Mflops) with 8 threads. +After split step 1: tpop: 0.01597 s ~Mflops: 0.053 nsubm:53 otn:8 +Applying split (23 -> 53 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00167x): 0.016s -> 0.01597s, so IGNORING this instance. +Split (53 -> 121 leaves, 72 -> 164 subms) took 0.03197s (of which: 9.06e-06s analysis, -4.16e+10s mem.mgmt); compute time: 0.0002904s overall, 1.526e-05s searches, 0.0002751s shuffle, 0.0001659s switch, 2.074e-05s quadrants. +3 iterations (8 th.) took 0.06398s; avg 0.02133s ( +/- 25.14/ 50.04 %); best 0.01597s; worst 0.032s; std dev. 0.007546 (taking best). +Reference operation time is 0.0159659 s (0.05261 Mflops) with 8 threads. +After split step 2: tpop: 0.01597 s ~Mflops: 0.053 nsubm:121 otn:8 +Applying split (53 -> 121 leaves, 8 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00212x): 0.016s -> 0.01597s, so IGNORING this instance. +Split (121 -> 143 leaves, 164 -> 194 subms) took 0.03988s (of which: 1.311e-05s analysis, -1.387e+10s mem.mgmt); compute time: 0.000319s overall, 4.292e-06s searches, 0.0003147s shuffle, 0.0001984s switch, 1.311e-05s quadrants. +3 iterations (8 th.) took 0.06393s; avg 0.02131s ( +/- 43.66/ 31.31 %); best 0.01201s; worst 0.02798s; std dev. 0.006783 (taking best). +Reference operation time is 0.012006 s (0.06996 Mflops) with 8 threads. +After split step 3: tpop: 0.01201 s ~Mflops: 0.070 nsubm:143 otn:8 +Applying split (121 -> 143 leaves, 8 th.) yielded SPEEDUP of 1.333x: 0.016s -> 0.01201s, so taking this instance. +Split (143 -> 146 leaves, 194 -> 198 subms) took 0.0279s (of which: 1.693e-05s analysis, -1.733e+09s mem.mgmt); compute time: 1.407e-05s overall, 1.192e-06s searches, 1.287e-05s shuffle, 5.96e-06s switch, 9.537e-07s quadrants. +3 iterations (8 th.) took 0.06395s; avg 0.02132s ( +/- 24.91/ 12.58 %); best 0.01601s; worst 0.024s; std dev. 0.003754 (taking best). +Reference operation time is 0.0160069 s (0.05248 Mflops) with 8 threads. +After split step 4: tpop: 0.01601 s ~Mflops: 0.052 nsubm:146 otn:8 +Applying split (143 -> 146 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.333x: 0.01201s -> 0.01601s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 4 split steps (of max 6) (23 -> 146 subms) took 0.456s (of which 0.1321s partitioning, 0s I/O); computing times: 0.000967s in par. loops, 2.575e-05s sorting, 4.411e-05s analyzing) +Total split + benchmarking process took 0.456s, equivalent to 38.0/28.5 new/old ops (0.1399s for 2 clones -- as 11.7/8.7 ops, or 5.8/4.4 ops per clone), SPEEDUP of 1.333x +Applying multi-split (23 -> 143 leaves, 3 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 1.333x (0.016s -> 0.01201s), will amortize in 114.2 ops by saving 0.003994s per op. +In 1 tuning rounds (tot. 0.9s, 0.22s for constructor, 3 clones) obtained a SPEEDUP of 33.3% (1.333x) (from 0.0525 to 0.06996 Mflops). autotuner chose 8 threads -Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz. -Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:5.18e-08 -Starting autotuning (16 x 5.17964e-08 s stages, transA=N, nrhs=1, timer gran.=5.17964e-08), 8 suggested as starting thread count(default). -3 iterations (8 th.) took 0.0002089s; avg 6.962e-05s ( +/- 23.97/ 44.86 %); best 5.293e-05s; worst 0.0001009s; std dev. 2.21e-05 (taking best). -~ 8 threads: 5.293e-05s (16 Mflops) (0/2 degradations so far) - -3 iterations (7 th.) took 0.0008872s; avg 0.0002957s ( +/- 73.56/ 51.17 %); best 7.82e-05s; worst 0.000447s; std dev. 0.0001577 (taking best). - 7 threads: 7.82e-05s (11 Mflops) (1/2 degradations so far) - -3 iterations (6 th.) took 0.0004022s; avg 0.0001341s ( +/- 27.62/ 47.78 %); best 9.704e-05s; worst 0.0001981s; std dev. 4.548e-05 (taking best). - 6 threads: 9.704e-05s (8.7 Mflops) (2/2 degradations so far) - -Best threads choice is 8; starting threads were 8; max speed gap is 1.8x; search took 0.0015s. -Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 14 subms, 10 lsubms, 3.1429 bpnz (tpop: 5.293e-05 Mflops: 15.870) -Merge (10 -> 8 leaves) took w.c.t. of 9.06e-06s, ~2.861e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) -3 iterations (8 th.) took 0.000191s; avg 6.366e-05s ( +/- 24.34/ 36.33 %); best 4.816e-05s; worst 8.678e-05s; std dev. 1.667e-05 (taking best). -~ 8 threads: 4.816e-05s (17 Mflops) (0/2 degradations so far) - -3 iterations (7 th.) took 0.000175s; avg 5.833e-05s ( +/- 55.45/ 63.08 %); best 2.599e-05s; worst 9.513e-05s; std dev. 2.84e-05 (taking best). - 7 threads: 2.599e-05s (32 Mflops) (0/2 degradations so far) - -3 iterations (6 th.) took 0.0005109s; avg 0.0001703s ( +/- 83.62/155.34 %); best 2.789e-05s; worst 0.0004349s; std dev. 0.0001873 (taking best). - 6 threads: 2.789e-05s (30 Mflops) (1/2 degradations so far) - -3 iterations (5 th.) took 0.001098s; avg 0.000366s ( +/- 95.11/ 58.76 %); best 1.788e-05s; worst 0.000581s; std dev. 0.0002484 (taking best). - 5 threads: 1.788e-05s (47 Mflops) (0/2 degradations so far) - -3 iterations (4 th.) took 8.917e-05s; avg 2.972e-05s ( +/- 18.98/ 14.71 %); best 2.408e-05s; worst 3.409e-05s; std dev. 4.186e-06 (taking best). - 4 threads: 2.408e-05s (35 Mflops) (1/2 degradations so far) - -3 iterations (3 th.) took 4.101e-05s; avg 1.367e-05s ( +/- 12.79/ 9.88 %); best 1.192e-05s; worst 1.502e-05s; std dev. 1.296e-06 (taking best). - 3 threads: 1.192e-05s (70 Mflops) (0/2 degradations so far) - -3 iterations (2 th.) took 3.91e-05s; avg 1.303e-05s ( +/- 15.85/ 15.24 %); best 1.097e-05s; worst 1.502e-05s; std dev. 1.656e-06 (taking best). - 2 threads: 1.097e-05s (77 Mflops) (0/2 degradations so far) - -3 iterations (1 th.) took 1.788e-05s; avg 5.96e-06s ( +/- 16.00/ 16.00 %); best 5.007e-06s; worst 6.914e-06s; std dev. 7.787e-07 (taking best). - 1 threads: 5.007e-06s (1.7e+02 Mflops) (0/2 degradations so far) - -Best threads choice is 1; starting threads were 8; max speed gap is 9.6x; search took 0.0022s. -After merge step 1: tpop: 5.007e-06 s ~Mflops: 167.772 nsubm:8 otn:1 -Applying merge (10 -> 8 leaves, 1 th.) yielded SPEEDUP of 10.571x: 5.293e-05s -> 5.007e-06s, so taking this instance. -Merge (8 -> 6 leaves) took w.c.t. of 7.868e-06s, ~3.099e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 5.794e-05s; avg 1.931e-05s ( +/- 22.22/ 13.58 %); best 1.502e-05s; worst 2.193e-05s; std dev. 3.059e-06 (taking best). -~ 8 threads: 1.502e-05s (56 Mflops) (0/2 degradations so far) - -3 iterations (7 th.) took 6.7e-05s; avg 2.233e-05s ( +/- 10.32/ 7.83 %); best 2.003e-05s; worst 2.408e-05s; std dev. 1.701e-06 (taking best). - 7 threads: 2.003e-05s (42 Mflops) (1/2 degradations so far) - -3 iterations (6 th.) took 0.0003252s; avg 0.0001084s ( +/- 76.91/152.71 %); best 2.503e-05s; worst 0.0002739s; std dev. 0.0001171 (taking best). - 6 threads: 2.503e-05s (34 Mflops) (2/2 degradations so far) - -Best threads choice is 8; starting threads were 8; max speed gap is 1.7x; search took 0.00048s. -After merge step 2: tpop: 1.502e-05 s ~Mflops: 55.924 nsubm:6 otn:8 -Applying merge (8 -> 6 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 3.000x: 5.007e-06s -> 1.502e-05s. -Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 merge steps (of max 6) (10 -> 6 subms) took 0.002726s (of which 2.098e-05s partitioning, 0s I/O); computing times: 5.96e-06s in par. loops, 1.907e-06s sorting, 2.861e-06s analyzing) -Total merge + benchmarking process took 0.002726s, equivalent to 544.5/51.5 new/old ops (3.314e-05s for 2 clones -- as 6.6/0.6 ops, or 3.3/0.3 ops per clone), SPEEDUP of 10.571x -Applying multi-merge (10 -> 8 leaves, 1 steps, 8 -> 1 th.sp.) yielded SPEEDUP of 10.571x (5.293e-05s -> 5.007e-06s), will amortize in 56.9 ops by saving 4.792e-05s per op. -In 1 tuning rounds (tot. 0.0043s, 3.3e-05s for constructor, 2 clones) obtained a SPEEDUP of 957.1% (10.57x) (from 15.87 to 167.8 Mflops). +Will autotune matrix: 20 x 20, type D, 210 nnz, 10 nnz/r, 194 subms, 143 lsubms, 4.2476 bpnz. +Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:5.366e-08 +Starting autotuning (16 x 5.36561e-08 s stages, transA=N, nrhs=1, timer gran.=5.36561e-08), 8 suggested as starting thread count(default). +3 iterations (8 th.) took 0.07199s; avg 0.024s ( +/- 0.04/ 0.02 %); best 0.02399s; worst 0.024s; std dev. 6.481e-06 (taking best). +~ 8 threads: 0.02399s (0.035 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.06397s; avg 0.02132s ( +/- 43.70/ 50.05 %); best 0.01201s; worst 0.03199s; std dev. 0.008216 (taking best). + 7 threads: 0.01201s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 0.06398s; avg 0.02133s ( +/- 25.02/ 49.98 %); best 0.01599s; worst 0.03199s; std dev. 0.007538 (taking best). + 6 threads: 0.01599s (0.053 Mflops) (1/2 degradations so far) - +3 iterations (5 th.) took 0.068s; avg 0.02267s ( +/- 46.99/ 41.12 %); best 0.01202s; worst 0.03199s; std dev. 0.008207 (taking best). + 5 threads: 0.01202s (0.07 Mflops) (2/2 degradations so far) - +Best threads choice is 7; starting threads were 8; max speed gap is 2x; search took 0.27s. +Starting merge (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 194 subms, 143 lsubms, 4.2476 bpnz (tpop: 0.01201 Mflops: 0.070) +Merge (143 -> 97 leaves) took w.c.t. of 0.01599s, ~8.321e-05s of computing time (of which 1.311e-05s sorting, 1.001e-05s analysis) +3 iterations (8 th.) took 0.06798s; avg 0.02266s ( +/- 47.06/ 41.09 %); best 0.012s; worst 0.03197s; std dev. 0.008211 (taking best). +~ 8 threads: 0.012s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.07197s; avg 0.02399s ( +/- 0.13/ 0.07 %); best 0.02396s; worst 0.02401s; std dev. 2.246e-05 (taking best). + 7 threads: 0.02396s (0.035 Mflops) (1/2 degradations so far) - +3 iterations (6 th.) took 0.06397s; avg 0.02132s ( +/- 43.79/ 31.21 %); best 0.01199s; worst 0.02798s; std dev. 0.006799 (taking best). + 6 threads: 0.01199s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 0.068s; avg 0.02267s ( +/- 29.40/ 41.13 %); best 0.016s; worst 0.03199s; std dev. 0.006793 (taking best). + 5 threads: 0.016s (0.052 Mflops) (1/2 degradations so far) - +3 iterations (4 th.) took 0.07198s; avg 0.02399s ( +/- 33.43/ 49.91 %); best 0.01597s; worst 0.03597s; std dev. 0.008629 (taking best). + 4 threads: 0.01597s (0.053 Mflops) (2/2 degradations so far) - +Best threads choice is 6; starting threads were 8; max speed gap is 2x; search took 0.34s. +After merge step 1: tpop: 0.01199 s ~Mflops: 0.070 nsubm:97 otn:6 +Applying merge (143 -> 97 leaves, 6 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00159x): 0.01201s -> 0.01199s, so IGNORING this instance. +Merge (97 -> 65 leaves) took w.c.t. of 0.03598s, ~6.58e-05s of computing time (of which 1.431e-05s sorting, 1.001e-05s analysis) +3 iterations (8 th.) took 0.04799s; avg 0.016s ( +/- 25.12/ 50.01 %); best 0.01198s; worst 0.02399s; std dev. 0.005656 (taking best). +~ 8 threads: 0.01198s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.04799s; avg 0.016s ( +/- 24.97/ 49.84 %); best 0.012s; worst 0.02397s; std dev. 0.005638 (taking best). + 7 threads: 0.012s (0.07 Mflops) (1/2 degradations so far) - +3 iterations (6 th.) took 0.0759s; avg 0.0253s ( +/- 37.53/ 74.38 %); best 0.0158s; worst 0.04412s; std dev. 0.01331 (taking best). + 6 threads: 0.0158s (0.053 Mflops) (2/2 degradations so far) - +Best threads choice is 8; starting threads were 8; max speed gap is 1.3x; search took 0.17s. +After merge step 2: tpop: 0.01198 s ~Mflops: 0.070 nsubm:65 otn:8 +Applying merge (97 -> 65 leaves, 8 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=1.00227x): 0.01201s -> 0.01198s, so IGNORING this instance. +Merge (65 -> 48 leaves) took w.c.t. of 0.01208s, ~4.101e-05s of computing time (of which 7.153e-06s sorting, 8.106e-06s analysis) +3 iterations (8 th.) took 0.08797s; avg 0.02932s ( +/- 18.19/ 36.33 %); best 0.02399s; worst 0.03998s; std dev. 0.007533 (taking best). +~ 8 threads: 0.02399s (0.035 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.05999s; avg 0.02s ( +/- 39.87/ 20.03 %); best 0.01202s; worst 0.024s; std dev. 0.005638 (taking best). + 7 threads: 0.01202s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 0.09584s; avg 0.03195s ( +/- 0.15/ 0.12 %); best 0.0319s; worst 0.03198s; std dev. 3.593e-05 (taking best). + 6 threads: 0.0319s (0.026 Mflops) (1/2 degradations so far) - +3 iterations (5 th.) took 0.09612s; avg 0.03204s ( +/- 0.13/ 0.25 %); best 0.032s; worst 0.03212s; std dev. 5.613e-05 (taking best). + 5 threads: 0.032s (0.026 Mflops) (2/2 degradations so far) - +Best threads choice is 7; starting threads were 8; max speed gap is 2.7x; search took 0.34s. +After merge step 3: tpop: 0.01202 s ~Mflops: 0.070 nsubm:48 otn:7 +Applying merge (65 -> 48 leaves, 7 th.) yielded NEGLIGIBLE change (3th in a row) (old/new=0.99851x): 0.01201s -> 0.01202s, so IGNORING this instance. +Merge (48 -> 34 leaves) took w.c.t. of 0.01599s, ~4.172e-05s of computing time (of which 5.96e-06s sorting, 1.001e-05s analysis) +3 iterations (8 th.) took 0.07995s; avg 0.02665s ( +/- 9.96/ 19.89 %); best 0.02399s; worst 0.03195s; std dev. 0.003747 (taking best). +~ 8 threads: 0.02399s (0.035 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.07198s; avg 0.02399s ( +/- 0.05/ 0.04 %); best 0.02398s; worst 0.024s; std dev. 8.709e-06 (taking best). + 7 threads: 0.02398s (0.035 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 0.05999s; avg 0.02s ( +/- 39.99/ 20.02 %); best 0.012s; worst 0.024s; std dev. 0.005654 (taking best). + 6 threads: 0.012s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 0.052s; avg 0.01733s ( +/- 30.82/ 38.42 %); best 0.01199s; worst 0.02399s; std dev. 0.004987 (taking best). + 5 threads: 0.01199s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 0.06399s; avg 0.02133s ( +/- 25.04/ 50.01 %); best 0.01599s; worst 0.032s; std dev. 0.007543 (taking best). + 4 threads: 0.01599s (0.053 Mflops) (1/2 degradations so far) - +3 iterations (3 th.) took 0.06397s; avg 0.02132s ( +/- 25.07/ 50.05 %); best 0.01598s; worst 0.032s; std dev. 0.007546 (taking best). + 3 threads: 0.01598s (0.053 Mflops) (2/2 degradations so far) - +Best threads choice is 5; starting threads were 8; max speed gap is 2x; search took 0.39s. +After merge step 4: tpop: 0.01199 s ~Mflops: 0.070 nsubm:34 otn:5 +Applying merge (48 -> 34 leaves, 5 th.) yielded NEGLIGIBLE change (4th in a row) (old/new=1.00109x): 0.01201s -> 0.01199s, so IGNORING this instance. +Merge (34 -> 25 leaves) took w.c.t. of 0.01199s, ~3.672e-05s of computing time (of which 5.007e-06s sorting, 7.153e-06s analysis) +3 iterations (8 th.) took 0.09596s; avg 0.03199s ( +/- 24.98/ 12.51 %); best 0.024s; worst 0.03599s; std dev. 0.005649 (taking best). +~ 8 threads: 0.024s (0.035 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.05998s; avg 0.01999s ( +/- 40.03/ 20.04 %); best 0.01199s; worst 0.024s; std dev. 0.00566 (taking best). + 7 threads: 0.01199s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 0.06s; avg 0.02s ( +/- 20.15/ 39.97 %); best 0.01597s; worst 0.028s; std dev. 0.005653 (taking best). + 6 threads: 0.01597s (0.053 Mflops) (1/2 degradations so far) - +3 iterations (5 th.) took 0.064s; avg 0.02133s ( +/- 25.07/ 49.99 %); best 0.01598s; worst 0.032s; std dev. 0.007541 (taking best). + 5 threads: 0.01598s (0.053 Mflops) (2/2 degradations so far) - +Best threads choice is 7; starting threads were 8; max speed gap is 2x; search took 0.28s. +After merge step 5: tpop: 0.01199 s ~Mflops: 0.070 nsubm:25 otn:7 +Applying merge (34 -> 25 leaves, 7 th.) yielded NEGLIGIBLE change (5th in a row) (old/new=1.00133x): 0.01201s -> 0.01199s, so IGNORING this instance. +Merge (25 -> 16 leaves) took w.c.t. of 0.02396s, ~3.29e-05s of computing time (of which 6.199e-06s sorting, 7.868e-06s analysis) +3 iterations (8 th.) took 0.07597s; avg 0.02532s ( +/- 36.82/ 26.34 %); best 0.016s; worst 0.032s; std dev. 0.006794 (taking best). +~ 8 threads: 0.016s (0.052 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.06399s; avg 0.02133s ( +/- 24.99/ 49.93 %); best 0.016s; worst 0.03198s; std dev. 0.007531 (taking best). + 7 threads: 0.016s (0.052 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 0.06397s; avg 0.02132s ( +/- 24.98/ 49.94 %); best 0.016s; worst 0.03197s; std dev. 0.00753 (taking best). + 6 threads: 0.016s (0.053 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 0.07998s; avg 0.02666s ( +/- 39.99/ 20.04 %); best 0.016s; worst 0.032s; std dev. 0.007539 (taking best). + 5 threads: 0.016s (0.053 Mflops) (1/2 degradations so far) - +3 iterations (4 th.) took 0.06399s; avg 0.02133s ( +/- 25.02/ 49.94 %); best 0.01599s; worst 0.03198s; std dev. 0.007532 (taking best). + 4 threads: 0.01599s (0.053 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.0679s; avg 0.02263s ( +/- 29.66/ 58.99 %); best 0.01592s; worst 0.03598s; std dev. 0.009441 (taking best). + 3 threads: 0.01592s (0.053 Mflops) (0/2 degradations so far) - +3 iterations (2 th.) took 0.06006s; avg 0.02002s ( +/- 39.96/ 20.21 %); best 0.01202s; worst 0.02406s; std dev. 0.005656 (taking best). + 2 threads: 0.01202s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (1 th.) took 0.04798s; avg 0.01599s ( +/- 25.07/ 49.94 %); best 0.01198s; worst 0.02398s; std dev. 0.005648 (taking best). + 1 threads: 0.01198s (0.07 Mflops) (0/2 degradations so far) - +Best threads choice is 1; starting threads were 8; max speed gap is 1.3x; search took 0.52s. +After merge step 6: tpop: 0.01198 s ~Mflops: 0.070 nsubm:16 otn:1 +Applying merge (25 -> 16 leaves, 1 th.) yielded NEGLIGIBLE change (6th in a row) (old/new=1.00183x): 0.01201s -> 0.01198s, so IGNORING this instance. +A total of 6 merge steps (of max 6) (143 -> 16 subms) took 2.168s (of which 0.116s partitioning, 0s I/O); computing times: 0.0003014s in par. loops, 5.174e-05s sorting, 5.317e-05s analyzing) +Total merge + benchmarking process took 2.168s, equivalent to 180.6/180.6 new/old ops (0.05997s for 1 clones -- as 5.0/5.0 ops, or 5.0/5.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (8 th.) took 0.07599s; avg 0.02533s ( +/- 5.24/ 10.47 %); best 0.024s; worst 0.02798s; std dev. 0.001874 (taking best). +~ 8 threads: 0.024s (0.035 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.07198s; avg 0.02399s ( +/- 0.02/ 0.01 %); best 0.02399s; worst 0.024s; std dev. 2.686e-06 (taking best). + 7 threads: 0.02399s (0.035 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 0.07198s; avg 0.02399s ( +/- 0.07/ 0.04 %); best 0.02398s; worst 0.02401s; std dev. 1.133e-05 (taking best). + 6 threads: 0.02398s (0.035 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 0.07998s; avg 0.02666s ( +/- 39.97/ 20.05 %); best 0.016s; worst 0.032s; std dev. 0.007535 (taking best). + 5 threads: 0.016s (0.052 Mflops) (0/2 degradations so far) - +3 iterations (4 th.) took 0.05999s; avg 0.02s ( +/- 39.93/ 60.06 %); best 0.01201s; worst 0.03201s; std dev. 0.008645 (taking best). + 4 threads: 0.01201s (0.07 Mflops) (0/2 degradations so far) - +3 iterations (3 th.) took 0.07197s; avg 0.02399s ( +/- 0.04/ 0.03 %); best 0.02398s; worst 0.024s; std dev. 6.702e-06 (taking best). + 3 threads: 0.02398s (0.035 Mflops) (1/2 degradations so far) - +3 iterations (2 th.) took 0.05199s; avg 0.01733s ( +/- 18.95/ 26.60 %); best 0.01405s; worst 0.02194s; std dev. 0.003356 (taking best). + 2 threads: 0.01405s (0.06 Mflops) (2/2 degradations so far) - +Best threads choice is 4; starting threads were 8; max speed gap is 2x; search took 0.48s. +Starting split (and threads) based auto-tuning procedure (transA=N, nrhs=1, order=cols) (max 6 steps, inclusive 3 grace steps) on: 20 x 20, type D, 210 nnz, 10 nnz/r, 194 subms, 143 lsubms, 4.2476 bpnz (tpop: 0.01201 Mflops: 0.070) +Split (143 -> 146 leaves, 194 -> 198 subms) took 0.03199s (of which: 1.407e-05s analysis, -1.733e+09s mem.mgmt); compute time: 2.289e-05s overall, 2.146e-06s searches, 2.074e-05s shuffle, 1.192e-05s switch, 2.146e-06s quadrants. +3 iterations (8 th.) took 0.08385s; avg 0.02795s ( +/- 28.42/ 14.49 %); best 0.02001s; worst 0.032s; std dev. 0.005618 (taking best). +~ 8 threads: 0.02001s (0.042 Mflops) (0/2 degradations so far) - +3 iterations (7 th.) took 0.068s; avg 0.02267s ( +/- 12.31/ 24.11 %); best 0.01988s; worst 0.02813s; std dev. 0.003865 (taking best). + 7 threads: 0.01988s (0.042 Mflops) (0/2 degradations so far) - +3 iterations (6 th.) took 0.06396s; avg 0.02132s ( +/- 25.06/ 49.98 %); best 0.01598s; worst 0.03198s; std dev. 0.007535 (taking best). + 6 threads: 0.01598s (0.053 Mflops) (0/2 degradations so far) - +3 iterations (5 th.) took 0.07613s; avg 0.02538s ( +/- 32.40/ 26.01 %); best 0.01716s; worst 0.03198s; std dev. 0.006158 (taking best). + 5 threads: 0.01716s (0.049 Mflops) (1/2 degradations so far) - +3 iterations (4 th.) took 0.06783s; avg 0.02261s ( +/- 29.24/ 41.46 %); best 0.016s; worst 0.03199s; std dev. 0.006812 (taking best). + 4 threads: 0.016s (0.052 Mflops) (2/2 degradations so far) - +Best threads choice is 6; starting threads were 8; max speed gap is 1.3x; search took 0.36s. +After split step 1: tpop: 0.01598 s ~Mflops: 0.053 nsubm:146 otn:6 +Applying split (143 -> 146 leaves, 6 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.330x: 0.01201s -> 0.01598s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 split steps (of max 6) (143 -> 146 subms) took 0.392s (of which 0.03209s partitioning, 0s I/O); computing times: 2.289e-05s in par. loops, 2.146e-06s sorting, 1.407e-05s analyzing) +Total split + benchmarking process took 0.392s, equivalent to 32.6/32.6 new/old ops (0.04799s for 1 clones -- as 4.0/4.0 ops, or 4.0/4.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 3.4s, 0.11s for constructor, 2 clones) obtained NO speedup (best stays 0.06993 Mflops). check results are ok Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 2.789e-05 s (100.00 %) - analyzed arrays in 9.060e-06 s (32.48 %) - cleaned-up arrays in 0.000e+00 s (0.00 %) + converted COO to RSB in 9.581e-02 s (100.00 %) + analyzed arrays in 3.198e-02 s (33.38 %) + cleaned-up arrays in 9.537e-07 s (0.00 %) deduplicated arrays in 0.000e+00 s (0.00 %) - sorted arrays in 9.060e-06 s (32.48 %) - shuffled partitions in 5.007e-06 s (17.95 %) - memory allocations took 3.815e-06 s (13.68 %) - leafs setup took 0.000e+00 s (0.00 %) - halfword conversion took 9.537e-07 s (3.42 %) -Built (6 x 6)[0x5745dd90]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' + sorted arrays in 4.782e-02 s (49.92 %) + shuffled partitions in 1.599e-02 s (16.69 %) + memory allocations took 1.144e-05 s (0.01 %) + leafs setup took 2.146e-06 s (0.00 %) + halfword conversion took 9.537e-07 s (0.00 %) +Built (6 x 6)[0x57259310]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x20440b4 (coo:0, csr:1, hw:0, ic:1, fi:0), storage: 1, subm: 1, symflags:'UL' Read matrix pd.mtx 6 x 6 : 36 Matrix has no symmetry Using NRHS=4 -Repeated USMV took 0.2694E-04 s -A single USMM took 0.1001E-04 s -USMM-to-USMV speed ratio is is 2.690 x +Repeated USMV took 0.2289E-04 s +A single USMM took 0.5960E-05 s +USMM-to-USMV speed ratio is is 3.840 x Call auto-tuning routine.. Repeat measurement. -Tuned USMM took 0.2146E-05 s -Tuned-to-untuned speed ratio is is 4.667 x +Tuned USMM took 0.2861E-05 s +Tuned-to-untuned speed ratio is is 2.083 x FAILED: 0 PASSED: 2 /build/reproducible-path/librsb-1.3.0.2+dfsg/examples/fortran_rsb_fi @@ -8826,234 +8967,242 @@ Loading matrix from file "/build/reproducible-path/librsb-1.3.0.2+dfsg/pd.mtx". Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 4.590e-04 s (100.00 %) - analyzed arrays in 5.388e-05 s (11.74 %) - cleaned-up arrays in 8.106e-06 s (1.77 %) - deduplicated arrays in 9.537e-07 s (0.21 %) - sorted arrays in 3.190e-04 s (69.51 %) - shuffled partitions in 3.815e-05 s (8.31 %) - memory allocations took 7.868e-06 s (1.71 %) - leafs setup took 4.053e-06 s (0.88 %) - halfword conversion took 1.884e-05 s (4.10 %) -Built (6 x 6)[0x582849b0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + converted COO to RSB in 1.836e-01 s (100.00 %) + analyzed arrays in 5.996e-02 s (32.66 %) + cleaned-up arrays in 5.007e-06 s (0.00 %) + deduplicated arrays in 2.861e-06 s (0.00 %) + sorted arrays in 3.560e-02 s (19.39 %) + shuffled partitions in 5.602e-02 s (30.52 %) + memory allocations took 1.597e-05 s (0.01 %) + leafs setup took 9.060e-06 s (0.00 %) + halfword conversion took 3.197e-02 s (17.41 %) +Built (6 x 6)[0x57dd29b0]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Considering D clone. Base matrix: -(6 x 6)[0x58286d50]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(6 x 6)[0x57dd4d50]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' -Will use autotuning routine to sample matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz. +Will use autotuning routine to sample matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (8 th.) took 0.0003829s; avg 0.0001276s ( +/- 45.08/ 69.99 %); best 7.01e-05s; worst 0.000217s; std dev. 6.403e-05 (taking best). -Reference operation time is 7.00951e-05 s (2.054 Mflops) with 8 threads. -After 0.000414s, autotuning routine did not find a better threads count configuration. +3 iterations (8 th.) took 0.07991s; avg 0.02664s ( +/- 10.18/ 20.10 %); best 0.02392s; worst 0.03199s; std dev. 0.003786 (taking best). +Reference operation time is 0.0239241 s (0.006019 Mflops) with 8 threads. +After 0.079980s, autotuning routine did not find a better threads count configuration. -Will autotune matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz. +Will autotune matrix: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (8 th.) took 0.000411s; avg 0.000137s ( +/- 30.57/ 31.38 %); best 9.513e-05s; worst 0.00018s; std dev. 3.466e-05 (taking best). -Reference operation time is 9.5129e-05 s (1.514 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz (tpop: 9.513e-05 Mflops: 1.514) -Merge (22 -> 19 leaves) took w.c.t. of 2.217e-05s, ~6.914e-06s of computing time (of which 9.537e-07s sorting, 5.007e-06s analysis) -3 iterations (8 th.) took 0.0003731s; avg 0.0001244s ( +/- 34.82/ 56.04 %); best 8.106e-05s; worst 0.0001941s; std dev. 4.977e-05 (taking best). -Reference operation time is 8.10623e-05 s (1.776 Mflops) with 8 threads. -After merge step 1: tpop: 8.106e-05 s ~Mflops: 1.776 nsubm:19 otn:8 -Applying merge (22 -> 19 leaves, 8 th.) yielded SPEEDUP of 1.174x: 9.513e-05s -> 8.106e-05s, so taking this instance. -Merge (19 -> 16 leaves) took w.c.t. of 9.06e-06s, ~1.907e-06s of computing time (of which 0s sorting, 2.861e-06s analysis) -3 iterations (8 th.) took 0.0002589s; avg 8.631e-05s ( +/- 43.37/ 29.83 %); best 4.888e-05s; worst 0.0001121s; std dev. 2.708e-05 (taking best). -Reference operation time is 4.88758e-05 s (2.946 Mflops) with 8 threads. -After merge step 2: tpop: 4.888e-05 s ~Mflops: 2.946 nsubm:16 otn:8 -Applying merge (19 -> 16 leaves, 8 th.) yielded SPEEDUP of 1.659x: 8.106e-05s -> 4.888e-05s, so taking this instance. -Merge (16 -> 13 leaves) took w.c.t. of 9.06e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) -3 iterations (8 th.) took 0.0001791s; avg 5.968e-05s ( +/- 36.48/ 55.79 %); best 3.791e-05s; worst 9.298e-05s; std dev. 2.392e-05 (taking best). -Reference operation time is 3.79086e-05 s (3.799 Mflops) with 8 threads. -After merge step 3: tpop: 3.791e-05 s ~Mflops: 3.799 nsubm:13 otn:8 -Applying merge (16 -> 13 leaves, 8 th.) yielded SPEEDUP of 1.289x: 4.888e-05s -> 3.791e-05s, so taking this instance. -Merge (13 -> 10 leaves) took w.c.t. of 7.868e-06s, ~2.146e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 0.0003529s; avg 0.0001176s ( +/- 61.89/111.62 %); best 4.482e-05s; worst 0.0002489s; std dev. 9.302e-05 (taking best). -Reference operation time is 4.48227e-05 s (3.213 Mflops) with 8 threads. -After merge step 4: tpop: 4.482e-05 s ~Mflops: 3.213 nsubm:10 otn:8 -Applying merge (13 -> 10 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.182x: 3.791e-05s -> 4.482e-05s. -Merge (10 -> 7 leaves) took w.c.t. of 1.287e-05s, ~3.815e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) -3 iterations (8 th.) took 8.392e-05s; avg 2.797e-05s ( +/- 21.59/ 25.28 %); best 2.193e-05s; worst 3.505e-05s; std dev. 5.403e-06 (taking best). -Reference operation time is 2.19345e-05 s (6.565 Mflops) with 8 threads. -After merge step 5: tpop: 2.193e-05 s ~Mflops: 6.565 nsubm:7 otn:8 -Applying merge (10 -> 7 leaves, 8 th.) yielded SPEEDUP of 1.728x: 3.791e-05s -> 2.193e-05s, so taking this instance. -Merge (7 -> 4 leaves) took w.c.t. of 8.106e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 1.192e-06s analysis) -3 iterations (8 th.) took 5.603e-05s; avg 1.868e-05s ( +/- 40.00/ 65.96 %); best 1.121e-05s; worst 3.099e-05s; std dev. 8.776e-06 (taking best). -Reference operation time is 1.12057e-05 s (12.85 Mflops) with 8 threads. -After merge step 6: tpop: 1.121e-05 s ~Mflops: 12.851 nsubm:4 otn:8 -Applying merge (7 -> 4 leaves, 8 th.) yielded SPEEDUP of 1.957x: 2.193e-05s -> 1.121e-05s, so taking this instance. -A total of 6 merge steps (of max 6) (22 -> 4 subms) took 0.001665s (of which 8.297e-05s partitioning, 0s I/O); computing times: 1.86e-05s in par. loops, 4.768e-06s sorting, 1.383e-05s analyzing) -Total merge + benchmarking process took 0.001665s, equivalent to 148.6/17.5 new/old ops (0.000128s for 6 clones -- as 11.4/1.3 ops, or 1.9/0.2 ops per clone), SPEEDUP of 8.489x -Applying multi-merge (22 -> 4 leaves, 6 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 8.489x (9.513e-05s -> 1.121e-05s), will amortize in 19.8 ops by saving 8.392e-05s per op. -In 1 tuning rounds (tot. 0.0021s, 0.00013s for constructor, 6 clones) obtained a SPEEDUP of 748.9% (8.489x) (from 1.514 to 12.85 Mflops). -After 0.002138s, global autotuning declared speedup of 8.48936 x, when using threads count of 8 and a new matrix: -(6 x 6)[0x58288890]{D} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 4, symflags:'' +3 iterations (8 th.) took 0.06399s; avg 0.02133s ( +/- 25.01/ 12.52 %); best 0.016s; worst 0.024s; std dev. 0.003773 (taking best). +Reference operation time is 0.015995 s (0.009003 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type D, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.6667 bpnz (tpop: 0.016 Mflops: 0.009) +Merge (22 -> 16 leaves) took w.c.t. of 0.000123s, ~4.768e-05s of computing time (of which 2.146e-06s sorting, 5.007e-06s analysis) +3 iterations (8 th.) took 0.08785s; avg 0.02928s ( +/- 45.36/ 36.08 %); best 0.016s; worst 0.03985s; std dev. 0.009925 (taking best). +Reference operation time is 0.016 s (0.009 Mflops) with 8 threads. +After merge step 1: tpop: 0.016 s ~Mflops: 0.009 nsubm:16 otn:8 +Applying merge (22 -> 16 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99969x): 0.016s -> 0.016s, so IGNORING this instance. +Merge (16 -> 10 leaves) took w.c.t. of 0.008098s, ~2.003e-05s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 0.08388s; avg 0.02796s ( +/- 42.78/ 42.61 %); best 0.016s; worst 0.03987s; std dev. 0.009748 (taking best). +Reference operation time is 0.0159972 s (0.009002 Mflops) with 8 threads. +After merge step 2: tpop: 0.016 s ~Mflops: 0.009 nsubm:10 otn:8 +Applying merge (16 -> 10 leaves, 8 th.) yielded NEGLIGIBLE change (2th in a row) (old/new=0.99987x): 0.016s -> 0.016s, so IGNORING this instance. +Merge (10 -> 7 leaves) took w.c.t. of 1.979e-05s, ~5.96e-06s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 0.06068s; avg 0.02023s ( +/- 37.03/ 18.65 %); best 0.01274s; worst 0.024s; std dev. 0.005297 (taking best). +Reference operation time is 0.0127358 s (0.01131 Mflops) with 8 threads. +After merge step 3: tpop: 0.01274 s ~Mflops: 0.011 nsubm:7 otn:8 +Applying merge (10 -> 7 leaves, 8 th.) yielded SPEEDUP of 1.256x: 0.016s -> 0.01274s, so taking this instance. +Merge (7 -> 4 leaves) took w.c.t. of 1.788e-05s, ~5.96e-06s of computing time (of which 9.537e-07s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 0.05996s; avg 0.01999s ( +/- 39.92/ 20.08 %); best 0.01201s; worst 0.024s; std dev. 0.005642 (taking best). +Reference operation time is 0.0120091 s (0.01199 Mflops) with 8 threads. +After merge step 4: tpop: 0.01201 s ~Mflops: 0.012 nsubm:4 otn:8 +Applying merge (7 -> 4 leaves, 8 th.) yielded SPEEDUP of 1.061x: 0.01274s -> 0.01201s, so taking this instance. +Merge (4 -> 1 leaves) took w.c.t. of 1.812e-05s, ~6.914e-06s of computing time (of which 2.146e-06s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 5.96e-06s; avg 1.987e-06s ( +/- 97.13/152.00 %); best 5.71e-08s; worst 5.007e-06s; std dev. 2.171e-06 (taking best). +Reference operation time is 5.71012e-08 s (2522 Mflops) with 8 threads. +After merge step 5: tpop: 5.71e-08 s ~Mflops: 2521.836 nsubm:1 otn:8 +Applying merge (4 -> 1 leaves, 8 th.) yielded SPEEDUP of 210313.152x: 0.01201s -> 5.71e-08s, so taking this instance. +Merged all the matrix leaves: no reason to continue merging. +A total of 5 merge steps (of max 6) (22 -> 1 subms) took 0.48s (of which 0.00831s partitioning, 0s I/O); computing times: 8.655e-05s in par. loops, 9.06e-06s sorting, 2.122e-05s analyzing) +Total merge + benchmarking process took 0.48s, equivalent to 8406275.6/30.0 new/old ops (0.2432s for 4 clones -- as 4258371.6/15.2 ops, or 1064592.9/3.8 ops per clone), SPEEDUP of 280116.910x +Applying multi-merge (22 -> 1 leaves, 5 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 280116.910x (0.016s -> 5.71e-08s), will amortize in 30.0 ops by saving 0.01599s per op. +In 1 tuning rounds (tot. 0.61s, 0.24s for constructor, 4 clones) obtained a SPEEDUP of 28011591.0% (2.801e+05x) (from 0.009003 to 2522 Mflops). +After 0.608020s, global autotuning declared speedup of 280117 x, when using threads count of 8 and a new matrix: +(6 x 6)[0x57dd85c0]{D} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' Considering S clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 8.011e-05 s (100.00 %) - analyzed arrays in 3.505e-05 s (43.75 %) + converted COO to RSB in 1.319e-01 s (100.00 %) + analyzed arrays in 5.993e-02 s (45.42 %) cleaned-up arrays in 0.000e+00 s (0.00 %) - deduplicated arrays in 0.000e+00 s (0.00 %) + deduplicated arrays in 1.192e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 2.694e-05 s (33.63 %) - memory allocations took 5.007e-06 s (6.25 %) - leafs setup took 2.146e-06 s (2.68 %) - halfword conversion took 1.097e-05 s (13.69 %) -Built (6 x 6)[0x58288890]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' + shuffled partitions in 4.800e-02 s (36.38 %) + memory allocations took 4.768e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 2.399e-02 s (18.19 %) +Built (6 x 6)[0x57dd4d50]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' Base matrix: -(6 x 6)[0x58288890]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' +(6 x 6)[0x57dd4d50]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 16, symflags:'' -Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.1111 bpnz. +Will use autotuning routine to sample matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (8 th.) took 0.0003989s; avg 0.000133s ( +/- 72.92/ 63.90 %); best 3.6e-05s; worst 0.0002179s; std dev. 7.475e-05 (taking best). -Reference operation time is 3.60012e-05 s (4 Mflops) with 8 threads. -After 0.000410s, autotuning routine did not find a better threads count configuration. +3 iterations (8 th.) took 0.05995s; avg 0.01998s ( +/- 39.96/ 20.08 %); best 0.012s; worst 0.024s; std dev. 0.005647 (taking best). +Reference operation time is 0.0119989 s (0.012 Mflops) with 8 threads. +After 0.059986s, autotuning routine did not find a better threads count configuration. -Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.1111 bpnz. +Will autotune matrix: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (8 th.) took 0.000231s; avg 7.701e-05s ( +/- 59.75/ 88.24 %); best 3.099e-05s; worst 0.000145s; std dev. 4.904e-05 (taking best). -Reference operation time is 3.09944e-05 s (4.646 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.1111 bpnz (tpop: 3.099e-05 Mflops: 4.646) -Merge (16 -> 13 leaves) took w.c.t. of 1.502e-05s, ~3.099e-06s of computing time (of which 1.192e-06s sorting, 3.099e-06s analysis) -3 iterations (8 th.) took 0.0001409s; avg 4.697e-05s ( +/- 2.03/ 4.06 %); best 4.601e-05s; worst 4.888e-05s; std dev. 1.349e-06 (taking best). -Reference operation time is 4.60148e-05 s (3.129 Mflops) with 8 threads. -After merge step 1: tpop: 4.601e-05 s ~Mflops: 3.129 nsubm:13 otn:8 -Applying merge (16 -> 13 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.485x: 3.099e-05s -> 4.601e-05s. +3 iterations (8 th.) took 0.06401s; avg 0.02134s ( +/- 24.95/ 34.13 %); best 0.01601s; worst 0.02862s; std dev. 0.00533 (taking best). +Reference operation time is 0.0160129 s (0.008993 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.01601 Mflops: 0.009) +Merge (16 -> 10 leaves) took w.c.t. of 0.01598s, ~1.907e-05s of computing time (of which 1.907e-06s sorting, 4.053e-06s analysis) +3 iterations (8 th.) took 0.07998s; avg 0.02666s ( +/- 9.98/ 19.90 %); best 0.024s; worst 0.03197s; std dev. 0.003751 (taking best). +Reference operation time is 0.0240009 s (0.006 Mflops) with 8 threads. +After merge step 1: tpop: 0.024 s ~Mflops: 0.006 nsubm:10 otn:8 +Applying merge (16 -> 10 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.499x: 0.01601s -> 0.024s. Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 1 merge steps (of max 6) (16 -> 13 subms) took 0.0001991s (of which 1.693e-05s partitioning, 0s I/O); computing times: 3.099e-06s in par. loops, 1.192e-06s sorting, 3.099e-06s analyzing) -Total merge + benchmarking process took 0.0001991s, equivalent to 6.4/6.4 new/old ops (2.599e-05s for 1 clones -- as 0.8/0.8 ops, or 0.8/0.8 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +A total of 1 merge steps (of max 6) (16 -> 10 subms) took 0.096s (of which 0.01599s partitioning, 0s I/O); computing times: 1.907e-05s in par. loops, 1.907e-06s sorting, 4.053e-06s analyzing) +Total merge + benchmarking process took 0.096s, equivalent to 6.0/6.0 new/old ops (0.07997s for 1 clones -- as 5.0/5.0 ops, or 5.0/5.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... -3 iterations (8 th.) took 0.0002601s; avg 8.67e-05s ( +/- 48.03/ 91.38 %); best 4.506e-05s; worst 0.0001659s; std dev. 5.605e-05 (taking best). -Reference operation time is 4.50611e-05 s (3.196 Mflops) with 8 threads. -Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.1111 bpnz (tpop: 4.506e-05 Mflops: 3.196) -Split (16 -> 22 leaves, 21 -> 29 subms) took 5.794e-05s (of which: 2.146e-06s analysis, -3.535e+09s mem.mgmt); compute time: 7.582e-05s overall, 2.146e-06s searches, 7.367e-05s shuffle, 6.58e-05s switch, 9.537e-07s quadrants. -3 iterations (8 th.) took 0.00015s; avg 4.999e-05s ( +/- 18.44/ 12.08 %); best 4.077e-05s; worst 5.603e-05s; std dev. 6.623e-06 (taking best). -Reference operation time is 4.07696e-05 s (3.532 Mflops) with 8 threads. -After split step 1: tpop: 4.077e-05 s ~Mflops: 3.532 nsubm:22 otn:8 -Applying split (16 -> 22 leaves, 8 th.) yielded SPEEDUP of 1.105x: 4.506e-05s -> 4.077e-05s, so taking this instance. -Split (22 -> 28 leaves, 29 -> 37 subms) took 5.412e-05s (of which: 1.907e-06s analysis, -3.535e+09s mem.mgmt); compute time: 6.986e-05s overall, 1.192e-06s searches, 6.866e-05s shuffle, 3.195e-05s switch, 1.907e-06s quadrants. -3 iterations (8 th.) took 0.0003841s; avg 0.000128s ( +/- 52.33/ 85.10 %); best 6.104e-05s; worst 0.000237s; std dev. 7.772e-05 (taking best). -Reference operation time is 6.10352e-05 s (2.359 Mflops) with 8 threads. -After split step 2: tpop: 6.104e-05 s ~Mflops: 2.359 nsubm:28 otn:8 -Applying split (22 -> 28 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.497x: 4.077e-05s -> 6.104e-05s. +3 iterations (8 th.) took 0.05999s; avg 0.02s ( +/- 39.99/ 20.01 %); best 0.012s; worst 0.024s; std dev. 0.005654 (taking best). +Reference operation time is 0.0119989 s (0.012 Mflops) with 8 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type S, 36 nnz, 6 nnz/r, 21 subms, 16 lsubms, 4.8889 bpnz (tpop: 0.012 Mflops: 0.012) +Split (16 -> 28 leaves, 21 -> 37 subms) took 0.02398s (of which: 4.053e-06s analysis, -6.933e+09s mem.mgmt); compute time: 7.987e-05s overall, 1.907e-06s searches, 7.796e-05s shuffle, 6.175e-05s switch, 3.815e-06s quadrants. +3 iterations (8 th.) took 0.04798s; avg 0.01599s ( +/- 24.95/ 49.77 %); best 0.012s; worst 0.02395s; std dev. 0.005629 (taking best). +Reference operation time is 0.0120041 s (0.012 Mflops) with 8 threads. +After split step 1: tpop: 0.012 s ~Mflops: 0.012 nsubm:28 otn:8 +Applying split (16 -> 28 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=0.99956x): 0.012s -> 0.012s, so IGNORING this instance. +Split (28 -> 28 leaves, 37 -> 37 subms) took 0.02796s (of which: 5.96e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 0.06397s; avg 0.02132s ( +/- 24.99/ 49.94 %); best 0.01599s; worst 0.03197s; std dev. 0.00753 (taking best). +Reference operation time is 0.0159941 s (0.009003 Mflops) with 8 threads. +After split step 2: tpop: 0.01599 s ~Mflops: 0.009 nsubm:28 otn:8 +Applying split (28 -> 28 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.333x: 0.012s -> 0.01599s. Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 split steps (of max 6) (16 -> 28 subms) took 0.0007482s (of which 0.0001731s partitioning, 0s I/O); computing times: 0.0001457s in par. loops, 3.338e-06s sorting, 4.053e-06s analyzing) -Total split + benchmarking process took 0.0007482s, equivalent to 18.4/16.6 new/old ops (5.078e-05s for 2 clones -- as 1.2/1.1 ops, or 0.6/0.6 ops per clone), SPEEDUP of 1.105x -Applying multi-split (16 -> 22 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 1.105x (4.506e-05s -> 4.077e-05s), will amortize in 174.3 ops by saving 4.292e-06s per op. -In 1 tuning rounds (tot. 0.0015s, 7.7e-05s for constructor, 3 clones) obtained a SPEEDUP of 10.5% (1.105x) (from 3.196 to 3.532 Mflops). -After 0.001538s, global autotuning declared speedup of 1.10526 x, when using threads count of 8 and a new matrix: -(6 x 6)[0x5828c860]{S} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +A total of 2 split steps (of max 6) (16 -> 28 subms) took 0.164s (of which 0.05201s partitioning, 0s I/O); computing times: 7.987e-05s in par. loops, 1.907e-06s sorting, 1.001e-05s analyzing) +Total split + benchmarking process took 0.164s, equivalent to 13.7/13.7 new/old ops (0.04793s for 1 clones -- as 4.0/4.0 ops, or 4.0/4.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +In 1 tuning rounds (tot. 0.51s, 0.13s for constructor, 2 clones) obtained NO speedup (best stays 0.012 Mflops). +After 0.512024s, global autotuning found old matrix optimal, with declared speedup 1 x when using 8 threads Considering C clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 8.607e-05 s (100.00 %) - analyzed arrays in 3.290e-05 s (38.23 %) - cleaned-up arrays in 0.000e+00 s (0.00 %) - deduplicated arrays in 9.537e-07 s (1.11 %) + converted COO to RSB in 1.559e-01 s (100.00 %) + analyzed arrays in 5.994e-02 s (38.44 %) + cleaned-up arrays in 9.537e-07 s (0.00 %) + deduplicated arrays in 9.537e-07 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.099e-05 s (36.01 %) - memory allocations took 6.199e-06 s (7.20 %) - leafs setup took 2.146e-06 s (2.49 %) - halfword conversion took 1.287e-05 s (14.96 %) -Built (6 x 6)[0x5828c860]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' + shuffled partitions in 3.601e-02 s (23.09 %) + memory allocations took 6.914e-06 s (0.00 %) + leafs setup took 4.053e-06 s (0.00 %) + halfword conversion took 5.998e-02 s (38.46 %) +Built (6 x 6)[0x57dd9c30]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Base matrix: -(6 x 6)[0x5828c860]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' +(6 x 6)[0x57dd9c30]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 22, symflags:'' Will use autotuning routine to sample matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (8 th.) took 0.0004029s; avg 0.0001343s ( +/- 69.47/126.33 %); best 4.101e-05s; worst 0.000304s; std dev. 0.0001202 (taking best). -Reference operation time is 4.1008e-05 s (14.05 Mflops) with 8 threads. -After 0.000414s, autotuning routine did not find a better threads count configuration. +3 iterations (8 th.) took 0.07195s; avg 0.02398s ( +/- 50.16/ 50.12 %); best 0.01195s; worst 0.03601s; std dev. 0.009819 (taking best). +Reference operation time is 0.0119541 s (0.04818 Mflops) with 8 threads. +After 0.071987s, autotuning routine did not find a better threads count configuration. Will autotune matrix: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (8 th.) took 0.0003531s; avg 0.0001177s ( +/- 58.27/ 54.56 %); best 4.911e-05s; worst 0.0001819s; std dev. 5.43e-05 (taking best). -Reference operation time is 4.91142e-05 s (11.73 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz (tpop: 4.911e-05 Mflops: 11.728) -Merge (22 -> 19 leaves) took w.c.t. of 9.06e-06s, ~1.907e-06s of computing time (of which 0s sorting, 1.907e-06s analysis) -3 iterations (8 th.) took 0.0003071s; avg 0.0001024s ( +/- 62.73/ 62.11 %); best 3.815e-05s; worst 0.0001659s; std dev. 5.217e-05 (taking best). -Reference operation time is 3.8147e-05 s (15.1 Mflops) with 8 threads. -After merge step 1: tpop: 3.815e-05 s ~Mflops: 15.099 nsubm:19 otn:8 -Applying merge (22 -> 19 leaves, 8 th.) yielded SPEEDUP of 1.288x: 4.911e-05s -> 3.815e-05s, so taking this instance. -Merge (19 -> 16 leaves) took w.c.t. of 7.153e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (8 th.) took 0.0002451s; avg 8.17e-05s ( +/- 34.92/ 59.05 %); best 5.317e-05s; worst 0.0001299s; std dev. 3.43e-05 (taking best). -Reference operation time is 5.31673e-05 s (10.83 Mflops) with 8 threads. -After merge step 2: tpop: 5.317e-05 s ~Mflops: 10.834 nsubm:16 otn:8 -Applying merge (19 -> 16 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.394x: 3.815e-05s -> 5.317e-05s. +3 iterations (8 th.) took 0.072s; avg 0.024s ( +/- 33.37/ 33.33 %); best 0.01599s; worst 0.032s; std dev. 0.006536 (taking best). +Reference operation time is 0.01599 s (0.03602 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz (tpop: 0.01599 Mflops: 0.036) +Merge (22 -> 19 leaves) took w.c.t. of 2.098e-05s, ~5.007e-06s of computing time (of which 2.146e-06s sorting, 5.007e-06s analysis) +3 iterations (8 th.) took 0.06394s; avg 0.02131s ( +/- 25.14/ 12.59 %); best 0.01596s; worst 0.024s; std dev. 0.003788 (taking best). +Reference operation time is 0.0159559 s (0.0361 Mflops) with 8 threads. +After merge step 1: tpop: 0.01596 s ~Mflops: 0.036 nsubm:19 otn:8 +Applying merge (22 -> 19 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00214x): 0.01599s -> 0.01596s, so IGNORING this instance. +Merge (19 -> 16 leaves) took w.c.t. of 2.313e-05s, ~5.96e-06s of computing time (of which 1.907e-06s sorting, 4.768e-06s analysis) +3 iterations (8 th.) took 0.07196s; avg 0.02399s ( +/- 0.14/ 0.11 %); best 0.02395s; worst 0.02401s; std dev. 2.538e-05 (taking best). +Reference operation time is 0.023952 s (0.02405 Mflops) with 8 threads. +After merge step 2: tpop: 0.02395 s ~Mflops: 0.024 nsubm:16 otn:8 +Applying merge (19 -> 16 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.498x: 0.01599s -> 0.02395s. Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). -A total of 2 merge steps (of max 6) (22 -> 16 subms) took 0.0006011s (of which 1.907e-05s partitioning, 0s I/O); computing times: 3.815e-06s in par. loops, 9.537e-07s sorting, 4.053e-06s analyzing) -Total merge + benchmarking process took 0.0006011s, equivalent to 15.8/12.2 new/old ops (3.386e-05s for 2 clones -- as 0.9/0.7 ops, or 0.4/0.3 ops per clone), SPEEDUP of 1.288x -Applying multi-merge (22 -> 19 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 1.288x (4.911e-05s -> 3.815e-05s), will amortize in 54.8 ops by saving 1.097e-05s per op. -In 1 tuning rounds (tot. 0.00099s, 3.4e-05s for constructor, 2 clones) obtained a SPEEDUP of 28.8% (1.288x) (from 11.73 to 15.1 Mflops). -After 0.000994s, global autotuning declared speedup of 1.2875 x, when using threads count of 8 and a new matrix: -(6 x 6)[0x58286d50]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 19, symflags:'' +A total of 2 merge steps (of max 6) (22 -> 16 subms) took 0.136s (of which 5.102e-05s partitioning, 0s I/O); computing times: 1.097e-05s in par. loops, 4.053e-06s sorting, 9.775e-06s analyzing) +Total merge + benchmarking process took 0.136s, equivalent to 8.5/8.5 new/old ops (0.08796s for 1 clones -- as 5.5/5.5 ops, or 5.5/5.5 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (8 th.) took 0.07598s; avg 0.02533s ( +/- 5.30/ 10.52 %); best 0.02399s; worst 0.02799s; std dev. 0.001884 (taking best). +Reference operation time is 0.0239861 s (0.02401 Mflops) with 8 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type C, 36 nnz, 6 nnz/r, 29 subms, 22 lsubms, 4.2778 bpnz (tpop: 0.02399 Mflops: 0.024) +Split (22 -> 25 leaves, 29 -> 33 subms) took 0.03564s (of which: 4.053e-06s analysis, -1.733e+09s mem.mgmt); compute time: 1.502e-05s overall, 2.146e-06s searches, 1.287e-05s shuffle, 5.007e-06s switch, 9.537e-07s quadrants. +3 iterations (8 th.) took 0.06031s; avg 0.0201s ( +/- 38.69/ 19.37 %); best 0.01233s; worst 0.024s; std dev. 0.0055 (taking best). +Reference operation time is 0.012325 s (0.04673 Mflops) with 8 threads. +After split step 1: tpop: 0.01233 s ~Mflops: 0.047 nsubm:25 otn:8 +Applying split (22 -> 25 leaves, 8 th.) yielded SPEEDUP of 1.946x: 0.02399s -> 0.01233s, so taking this instance. +Split (25 -> 28 leaves, 33 -> 37 subms) took 0.02798s (of which: 5.007e-06s analysis, -1.733e+09s mem.mgmt); compute time: 8.702e-05s overall, 9.537e-07s searches, 8.607e-05s shuffle, 7.987e-05s switch, 9.537e-07s quadrants. +3 iterations (8 th.) took 0.04798s; avg 0.01599s ( +/- 0.08/ 0.05 %); best 0.01598s; worst 0.016s; std dev. 9.692e-06 (taking best). +Reference operation time is 0.0159791 s (0.03605 Mflops) with 8 threads. +After split step 2: tpop: 0.01598 s ~Mflops: 0.036 nsubm:28 otn:8 +Applying split (25 -> 28 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.296x: 0.01233s -> 0.01598s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 2 split steps (of max 6) (22 -> 28 subms) took 0.232s (of which 0.06367s partitioning, 0s I/O); computing times: 0.000102s in par. loops, 3.099e-06s sorting, 9.06e-06s analyzing) +Total split + benchmarking process took 0.232s, equivalent to 18.8/9.7 new/old ops (0.132s for 2 clones -- as 10.7/5.5 ops, or 5.4/2.8 ops per clone), SPEEDUP of 1.946x +Applying multi-split (22 -> 25 leaves, 1 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 1.946x (0.02399s -> 0.01233s), will amortize in 19.9 ops by saving 0.01166s per op. +In 1 tuning rounds (tot. 0.68s, 0.22s for constructor, 3 clones) obtained a SPEEDUP of 94.6% (1.946x) (from 0.02401 to 0.04673 Mflops). +After 0.676028s, global autotuning declared speedup of 1.94613 x, when using threads count of 8 and a new matrix: +(6 x 6)[0x57ddb980]{C} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 25, symflags:'' Considering Z clone. Building a matrix with 36 nnz, 6 x 6 Duplicates check: 36 - 0 = 36 - converted COO to RSB in 9.489e-05 s (100.00 %) - analyzed arrays in 3.290e-05 s (34.67 %) - cleaned-up arrays in 1.192e-06 s (1.26 %) - deduplicated arrays in 0.000e+00 s (0.00 %) + converted COO to RSB in 1.359e-01 s (100.00 %) + analyzed arrays in 5.191e-02 s (38.19 %) + cleaned-up arrays in 9.537e-07 s (0.00 %) + deduplicated arrays in 1.192e-06 s (0.00 %) sorted arrays in 0.000e+00 s (0.00 %) - shuffled partitions in 3.815e-05 s (40.20 %) - memory allocations took 7.868e-06 s (8.29 %) - leafs setup took 1.907e-06 s (2.01 %) - halfword conversion took 1.192e-05 s (12.56 %) -Built (6 x 6)[0x5828c860]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 25, symflags:'' + shuffled partitions in 3.600e-02 s (26.48 %) + memory allocations took 4.768e-06 s (0.00 %) + leafs setup took 2.861e-06 s (0.00 %) + halfword conversion took 4.800e-02 s (35.31 %) +Built (6 x 6)[0x57dd9c30]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x42046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' Base matrix: -(6 x 6)[0x5828c860]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 25, symflags:'' +(6 x 6)[0x57dd9c30]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' -Will use autotuning routine to sample matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 33 subms, 25 lsubms, 4.5556 bpnz. +Will use autotuning routine to sample matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (8 th.) took 0.000252s; avg 8.4e-05s ( +/- 33.30/ 43.90 %); best 5.603e-05s; worst 0.0001209s; std dev. 2.721e-05 (taking best). -Reference operation time is 5.60284e-05 s (10.28 Mflops) with 8 threads. -After 0.000263s, autotuning routine did not find a better threads count configuration. +3 iterations (8 th.) took 0.04797s; avg 0.01599s ( +/- 25.23/ 50.19 %); best 0.01196s; worst 0.02401s; std dev. 0.005674 (taking best). +Reference operation time is 0.011955 s (0.04818 Mflops) with 8 threads. +After 0.047996s, autotuning routine did not find a better threads count configuration. -Will autotune matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 33 subms, 25 lsubms, 4.5556 bpnz. +Will autotune matrix: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz. Parameters: verbosity:1 mintimes:3 maxtimes:10 mindt:0 maxdt:0.1 -3 iterations (8 th.) took 0.0004029s; avg 0.0001343s ( +/- 51.54/ 57.10 %); best 6.509e-05s; worst 0.000211s; std dev. 5.98e-05 (taking best). -Reference operation time is 6.50883e-05 s (8.85 Mflops) with 8 threads. -Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 33 subms, 25 lsubms, 4.5556 bpnz (tpop: 6.509e-05 Mflops: 8.850) -Merge (25 -> 19 leaves) took w.c.t. of 0.0001991s, ~0.0003748s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (8 th.) took 0.000577s; avg 0.0001923s ( +/- 66.65/ 97.48 %); best 6.413e-05s; worst 0.0003798s; std dev. 0.0001355 (taking best). -Reference operation time is 6.41346e-05 s (8.981 Mflops) with 8 threads. -After merge step 1: tpop: 6.413e-05 s ~Mflops: 8.981 nsubm:19 otn:8 -Applying merge (25 -> 19 leaves, 8 th.) yielded SPEEDUP of 1.015x: 6.509e-05s -> 6.413e-05s, so taking this instance. -Merge (19 -> 13 leaves) took w.c.t. of 1.192e-05s, ~5.722e-06s of computing time (of which 9.537e-07s sorting, 1.907e-06s analysis) -3 iterations (8 th.) took 0.0004392s; avg 0.0001464s ( +/- 73.29/137.79 %); best 3.91e-05s; worst 0.0003481s; std dev. 0.0001427 (taking best). -Reference operation time is 3.91006e-05 s (14.73 Mflops) with 8 threads. -After merge step 2: tpop: 3.91e-05 s ~Mflops: 14.731 nsubm:13 otn:8 -Applying merge (19 -> 13 leaves, 8 th.) yielded SPEEDUP of 1.640x: 6.413e-05s -> 3.91e-05s, so taking this instance. -Merge (13 -> 10 leaves) took w.c.t. of 8.106e-06s, ~1.907e-06s of computing time (of which 9.537e-07s sorting, 2.146e-06s analysis) -3 iterations (8 th.) took 0.0002201s; avg 7.335e-05s ( +/- 39.87/ 21.24 %); best 4.411e-05s; worst 8.893e-05s; std dev. 2.069e-05 (taking best). -Reference operation time is 4.41074e-05 s (13.06 Mflops) with 8 threads. -After merge step 3: tpop: 4.411e-05 s ~Mflops: 13.059 nsubm:10 otn:8 -Applying merge (13 -> 10 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.128x: 3.91e-05s -> 4.411e-05s. -Merge (10 -> 7 leaves) took w.c.t. of 8.106e-06s, ~2.861e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 0.000159s; avg 5.301e-05s ( +/- 50.97/ 26.39 %); best 2.599e-05s; worst 6.7e-05s; std dev. 1.911e-05 (taking best). -Reference operation time is 2.59876e-05 s (22.16 Mflops) with 8 threads. -After merge step 4: tpop: 2.599e-05 s ~Mflops: 22.164 nsubm:7 otn:8 -Applying merge (10 -> 7 leaves, 8 th.) yielded SPEEDUP of 1.505x: 3.91e-05s -> 2.599e-05s, so taking this instance. -Merge (7 -> 4 leaves) took w.c.t. of 3.815e-06s, ~1.907e-06s of computing time (of which 0s sorting, 0s analysis) -3 iterations (8 th.) took 5.507e-05s; avg 1.836e-05s ( +/- 23.38/ 41.56 %); best 1.407e-05s; worst 2.599e-05s; std dev. 5.409e-06 (taking best). -Reference operation time is 1.40667e-05 s (40.95 Mflops) with 8 threads. -After merge step 5: tpop: 1.407e-05 s ~Mflops: 40.948 nsubm:4 otn:8 -Applying merge (7 -> 4 leaves, 8 th.) yielded SPEEDUP of 1.847x: 2.599e-05s -> 1.407e-05s, so taking this instance. -Merge (4 -> 1 leaves) took w.c.t. of 7.868e-06s, ~4.053e-06s of computing time (of which 9.537e-07s sorting, 9.537e-07s analysis) -3 iterations (8 th.) took 4.053e-06s; avg 1.351e-06s ( +/- 29.41/ 41.18 %); best 9.537e-07s; worst 1.907e-06s; std dev. 4.052e-07 (taking best). -Reference operation time is 9.53674e-07 s (604 Mflops) with 8 threads. -After merge step 6: tpop: 9.537e-07 s ~Mflops: 603.980 nsubm:1 otn:8 -Applying merge (4 -> 1 leaves, 8 th.) yielded SPEEDUP of 14.750x: 1.407e-05s -> 9.537e-07s, so taking this instance. -Merged all the matrix leaves: no reason to continue merging. -A total of 6 merge steps (of max 6) (25 -> 1 subms) took 0.001949s (of which 0.000257s partitioning, 0s I/O); computing times: 0.0003912s in par. loops, 4.768e-06s sorting, 8.106e-06s analyzing) -Total merge + benchmarking process took 0.001949s, equivalent to 2043.8/29.9 new/old ops (0.0001087s for 6 clones -- as 114.0/1.7 ops, or 19.0/0.3 ops per clone), SPEEDUP of 68.250x -Applying multi-merge (25 -> 1 leaves, 6 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 68.250x (6.509e-05s -> 9.537e-07s), will amortize in 30.4 ops by saving 6.413e-05s per op. -In 1 tuning rounds (tot. 0.0024s, 0.00011s for constructor, 6 clones) obtained a SPEEDUP of 6725.0% (68.25x) (from 8.85 to 604 Mflops). -After 0.002401s, global autotuning declared speedup of 68.25 x, when using threads count of 8 and a new matrix: -(6 x 6)[0x58288890]{Z} @ (0(0..6),0(0..6)) (36 nnz, 6 nnz/r) flags 0x2244086 (coo:0, csr:1, hw:1, ic:1, fi:0), storage: 1, subm: 1, symflags:'' +3 iterations (8 th.) took 0.06398s; avg 0.02133s ( +/- 43.74/ 31.27 %); best 0.012s; worst 0.02799s; std dev. 0.006796 (taking best). +Reference operation time is 0.011997 s (0.04801 Mflops) with 8 threads. +Starting merge (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz (tpop: 0.012 Mflops: 0.048) +Merge (28 -> 22 leaves) took w.c.t. of 0.008013s, ~1.621e-05s of computing time (of which 4.768e-06s sorting, 5.007e-06s analysis) +3 iterations (8 th.) took 0.104s; avg 0.03465s ( +/- 53.85/ 61.51 %); best 0.01599s; worst 0.05597s; std dev. 0.01643 (taking best). +Reference operation time is 0.0159919 s (0.03602 Mflops) with 8 threads. +After merge step 1: tpop: 0.01599 s ~Mflops: 0.036 nsubm:22 otn:8 +Applying merge (28 -> 22 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.333x: 0.012s -> 0.01599s. +Skipping further merge based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 1 merge steps (of max 6) (28 -> 22 subms) took 0.112s (of which 0.008019s partitioning, 0s I/O); computing times: 1.621e-05s in par. loops, 4.768e-06s sorting, 5.007e-06s analyzing) +Total merge + benchmarking process took 0.112s, equivalent to 9.3/9.3 new/old ops (0.04797s for 1 clones -- as 4.0/4.0 ops, or 4.0/4.0 ops per clone), SPEEDUP of 1.000x (NO SPEEDUP) +Merging based autotuning FAILED (=NO SPEEDUP); let's try splitting then... +3 iterations (8 th.) took 0.06399s; avg 0.02133s ( +/- 25.09/ 50.06 %); best 0.01598s; worst 0.03201s; std dev. 0.00755 (taking best). +Reference operation time is 0.0159791 s (0.03605 Mflops) with 8 threads. +Starting split (same threads) based auto-tuning procedure (transA=N, nrhs=2, order=cols) (max 6 steps, inclusive 3 grace steps) on: 6 x 6, type Z, 36 nnz, 6 nnz/r, 37 subms, 28 lsubms, 4.4444 bpnz (tpop: 0.01598 Mflops: 0.036) +Split (28 -> 28 leaves, 37 -> 37 subms) took 0.03197s (of which: 5.007e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 0.068s; avg 0.02267s ( +/- 29.50/ 58.92 %); best 0.01598s; worst 0.03602s; std dev. 0.009443 (taking best). +Reference operation time is 0.0159791 s (0.03605 Mflops) with 8 threads. +After split step 1: tpop: 0.01598 s ~Mflops: 0.036 nsubm:28 otn:8 +Applying split (28 -> 28 leaves, 8 th.) yielded NEGLIGIBLE change (1th in a row) (old/new=1.00000x): 0.01598s -> 0.01598s, so IGNORING this instance. +Split (28 -> 28 leaves, 37 -> 37 subms) took 0.01599s (of which: 5.007e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 0.06398s; avg 0.02133s ( +/- 27.88/ 49.91 %); best 0.01538s; worst 0.03197s; std dev. 0.007544 (taking best). +Reference operation time is 0.0153809 s (0.03745 Mflops) with 8 threads. +After split step 2: tpop: 0.01538 s ~Mflops: 0.037 nsubm:28 otn:8 +Applying split (28 -> 28 leaves, 8 th.) yielded SPEEDUP of 1.039x: 0.01598s -> 0.01538s, so taking this instance. +Split (28 -> 28 leaves, 37 -> 37 subms) took 0.03194s (of which: 5.96e-06s analysis, 0s mem.mgmt); compute time: 0s overall, 0s searches, 0s shuffle, 0s switch, 0s quadrants. +3 iterations (8 th.) took 0.08s; avg 0.02667s ( +/- 10.02/ 19.89 %); best 0.02399s; worst 0.03197s; std dev. 0.00375 (taking best). +Reference operation time is 0.0239949 s (0.02401 Mflops) with 8 threads. +After split step 3: tpop: 0.02399 s ~Mflops: 0.024 nsubm:28 otn:8 +Applying split (28 -> 28 leaves, 8 th.) yielded SLOWDOWN (1th of 3 tolerable) of 1.560x: 0.01538s -> 0.02399s. +Skipping further split based tests after 1 definite performance degradations in a row (and last exceeding limit). +A total of 3 split steps (of max 6) (28 -> 28 subms) took 0.356s (of which 0.08s partitioning, 0s I/O); computing times: 0s in par. loops, 0s sorting, 1.597e-05s analyzing) +Total split + benchmarking process took 0.356s, equivalent to 23.1/22.3 new/old ops (0.128s for 2 clones -- as 8.3/8.0 ops, or 4.2/4.0 ops per clone), SPEEDUP of 1.039x +Applying multi-split (28 -> 28 leaves, 2 steps, 0 -> 8 th.sp.) yielded SPEEDUP of 1.039x (0.01598s -> 0.01538s), will amortize in 595.2 ops by saving 0.0005982s per op. +In 1 tuning rounds (tot. 0.71s, 0.18s for constructor, 3 clones) obtained a SPEEDUP of 3.9% (1.039x) (from 0.03605 to 0.03745 Mflops). +After 0.708065s, global autotuning declared speedup of 1.03889 x, when using threads count of 8 and a new matrix: +(6 x 6)[0x57ddc680]{Z} @ (0(0..0),0(0..0)) (36 nnz, 6 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 28, symflags:'' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/examples' gmake[3]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' @@ -9184,10 +9333,10 @@ 4 0 DIFF PRINT TEST END Beginning large binary search test. -Detected 3891118080 bytes of memory, comprehensive of 1528254464 of free memory. +Detected 3883683840 bytes of memory, comprehensive of 1554317312 of free memory. On this system, maximal array of coordinates can have 2147483137 elements and occupy 4294965252 bytes. -Will perform the test using less memory (69 MB) than on the maximal coordinate indices array (72449024) allows. -(c)allocated 18112256 nnz (72449024 bytes) +Will perform the test using less memory (87 MB) than on the maximal coordinate indices array (91996160) allows. +(c)allocated 22999040 nnz (91996160 bytes) Succeeded retrieving array last element. Successfully performed large binary search test. BASIC SPARSE BLAS TEST: BEGIN @@ -9196,7 +9345,7 @@ got RSB_IO_WANT_IS_INITIALIZED_MARKER: 1 INIT INTERFACE TEST: END (SUCCESS) DEVEL PRINT TEST: BEGIN -(4 x 4)[0x57ced780]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(4 x 4)[0x569d6780]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -9205,8 +9354,8 @@ RSB_FLAG_ASSEMBLED_IN_COO_ARRAYS | RSB_FLAG_OWN_PARTITIONING_ARRAYS | RSB_FLAG_SORT_INPUT -(2 x 2)[0x57ced850]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0x57ced920]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0x569d6850]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0x569d6920]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' #R 4 x 4, 4 nnz (16 bytes), 16 index space for bytes, 416 bytes for 2 structs (2 of which are on the diagonal) (1e+02% of nnz are on the diagonal) #N at 0 0, 4 x 4, 4 nnz ( 25%) #T at 0 0, 2 x 2, 2 nnz ( 50%) @@ -9214,9 +9363,9 @@ ( 0x2046186 = { rec:1 coo:1 css:1 hw:1 ic:1 fi:0 symflags: } ) DEVEL PRINT TEST: END PRINT TEST: BEGIN [QUIET] -(2 x 2)[0x57ced850]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(2 x 2)[0x57ced920]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' -(4 x 4)[0x57ced780]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' +(2 x 2)[0x569d6850]{S} @ (0(0..2),0(0..2)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(2 x 2)[0x569d6920]{S} @ (2(2..4),2(2..4)) (2 nnz, 1 nnz/r) flags 0x2144386 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 0, symflags:'' +(4 x 4)[0x569d6780]{S} @ (0(0..0),0(0..0)) (4 nnz, 1 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 2, symflags:'' RSB_FLAG_USE_HALFWORD_INDICES | RSB_FLAG_SORTED_INPUT | RSB_FLAG_WANT_COO_STORAGE | @@ -9234,8 +9383,8 @@ BASIC PRIMITIVES TEST: BEGIN BASIC PRIMITIVES TEST: END (SUCCESS) ADVANCED SPARSE BLAS TEST: BEGIN [limit 30.000000s] [QUIET] -Terminating testing earlier due to user timeout request: test took 30.002458 s, max allowed was 30.000000. - PASSED:42807 +Terminating testing earlier due to user timeout request: test took 30.056004 s, max allowed was 30.000000. + PASSED:628 FAILED:0 ADVANCED SPARSE BLAS TEST: END (SUCCESS) gmake qtests -C librsbpp @@ -9244,75 +9393,75 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' gmake[4]: Leaving directory '/build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp' ./rsbtt -if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/bash /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh +if ! test -f G.mtx ; then cp -p /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/G.mtx . ; fi ; /bin/sh /build/reproducible-path/librsb-1.3.0.2+dfsg/librsbpp/test.sh +++ wc -l ++ ./rsbpp Td,s G.mtx ++ grep Z-sort -++ wc -l + test 54 = 54 -++ ./rsbpp Td G.mtx ++ grep Z-sort +++ ./rsbpp Td G.mtx ++ wc -l + test 27 = 27 ++ ./rsbpp Td,z G.mtx ++ grep Z-sort ++ wc -l + test 54 = 54 -++ ./rsbpp vTd,z G.mtx -++ grep Z-sort ++ wc -l +++ grep Z-sort +++ ./rsbpp vTd,z G.mtx + test 54 = 54 +++ wc -l ++ ./rsbpp vTd,z G.mtx ++ grep Z-sort -++ wc -l + test 54 = 54 -++ ./rsbpp vvvTd,z G.mtx ++ grep Zorted +++ ./rsbpp vvvTd,z G.mtx ++ wc -l + test 8 = 8 +++ wc -l ++ ./rsbpp vvTd,z G.mtx ++ grep Z-sort -++ wc -l + test 54 = 54 ++ ./rsbpp vvTd,z G.mtx ++ grep Range ++ wc -l + test 0 = 0 ++ ./rsbpp vvvTd,z G.mtx -++ grep Range ++ wc -l +++ grep Range + test 258 -gt 0 ++ ./rsbpp vvvTd,z S.mtx -++ grep Range ++ wc -l +++ grep Range + test 0 -eq 0 ++ ./rsbpp vvvTd,z G.mtx -++ grep Range ++ wc -l +++ grep Range + test 258 = 258 ++ OMP_NUM_THREADS=1 ++ ./rsbpp m10M10I1r1,4,8sFv ++ grep spmm- ++ wc -l + test 9 = 9 -++ OMP_NUM_THREADS=1 -++ ./rsbpp C1000m100M100I1r1,4,8sFv ++ grep spmm- ++ wc -l +++ OMP_NUM_THREADS=1 +++ ./rsbpp C1000m100M100I1r1,4,8sFv + test 9 = 9 ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r1sFvtN,T -++ grep spmm- ++ wc -l +++ grep spmm- + test 3 = 3 ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r1vtN,TsF ++ grep spmm- ++ wc -l + test 2 = 2 +++ wc -l ++ OMP_NUM_THREADS=1 ++ ./rsbpp C1000m100M100I1r0vtN,TsF ++ grep spmm- -++ wc -l + test 0 = 0 ++ OMP_NUM_THREADS=1 ++ RSB_NUM_THREADS=1 @@ -9326,17 +9475,17 @@ ++ grep Recursing ++ wc -l + test 4 = 4 +++ wc -l ++ OMP_NUM_THREADS=1 ++ RSB_NUM_THREADS=1 ++ ./rsbpp vvvC1000m100M100I1r1vtN,ToRsF ++ grep Recursing -++ wc -l + test 208 = 208 +++ wc -l ++ OMP_NUM_THREADS=2 ++ RSB_NUM_THREADS=2 ++ ./rsbpp vvvC1000m100M100I1r1vtN,ToRsF ++ grep Recursing -++ wc -l + test 410 = 410 echo "Skipping tests based on Google Test (not detected at configure time)" Skipping tests based on Google Test (not detected at configure time) @@ -9383,7 +9532,7 @@ 0 0 0 0 before tuning for SPMV: -(3 x 3)[0x56d05f80]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' +(3 x 3)[0x56c300e0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x2046186 (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'' ** x: 1.1 @@ -9472,18 +9621,18 @@ BEGIN Rsb_Matrix_test_multimatrix_ms_mnrhs BEGIN -(3 x 3)[0x56d33960]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1.44828: -(3 x 3)[0x56d1c640]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0x56d33960]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1.08696: -(3 x 3)[0x56d2d120]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0x56d33960]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1.27273: -(3 x 3)[0x56d37440]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -(3 x 3)[0x56d33960]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' -Tuned with speedup factor of 1.26: -(3 x 3)[0x56d382f0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x56c5e010]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1.33089: +(3 x 3)[0x56c626d0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x56c5e010]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1.14314: +(3 x 3)[0x56c613e0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x56c5e010]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1.4939: +(3 x 3)[0x56c613e0]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +(3 x 3)[0x56c5e010]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' +Tuned with speedup factor of 1.28113: +(3 x 3)[0x56c66160]{D} @ (0(0..0),0(0..0)) (6 nnz, 2 nnz/r) flags 0x204619e (coo:1, csr:1, hw:1, ic:1, fi:0), storage: 40, subm: 3, symflags:'LT' END OK: terminating with no allocations registered in librsb [*] tests terminated successfully ! @@ -9500,10 +9649,10 @@ ./rsbtest --no-tune --max_t 0.01 --serial | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q Building ./rsbtest --no-tune --max_t 0.01 --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --no-trans --alpha 1 --type d --rand --serial . | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q adding ! ./rsbtest --mkl A.mkl -running on infom08-i386 +running on i-capture-the-hostname Built without the MKL. ( ! ./rsbtest --unrecognized-option-triggers-abort ) -running on infom08-i386 +running on i-capture-the-hostname /build/reproducible-path/librsb-1.3.0.2+dfsg/rsbtest/.libs/rsbtest: unrecognized option '--unrecognized-option-triggers-abort' unrecognized option, aborting. ( ./rsbtest --no-tune --max_t 0.01 --skip-loading-hermitian-matrices --skip-loading-unsymmetric-matrices --tune-maxt 10 --tune-maxr 10 --verbose-tuning --extra-verbose-interface --min_t 0.01 --max_t 0.01 --mintimes 1 --maxtimes 1 --verbose --skip-loading-symmetric-matrices A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q skip ) @@ -9512,7 +9661,7 @@ ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --types all --nthreads 1,2 --maxtimes 1 -+ A.mtx | dd if=/dev/stdin of=/dev/stdout bs=16M status=none iflag=fullblock | grep -q 2.threads ) ( ! ./rsbtest --no-tune --max_t 0.01 --quiet --render-only A.mtx > /dev/null ) ! ./rsbtest --no-tune --max_t 0.01 --quiet --max 1 --nrhs 1 --beta 1 --incy 1 --incx 1 --render --no-trans --alpha 1 --type all A.mtx -running on infom08-i386 +running on i-capture-the-hostname Will not invoke autotuning routine. Benchmark will sample for at most 0.01 s Built without render support! @@ -9564,7 +9713,7 @@ gmake[4]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' gmake[5]: Entering directory '/build/reproducible-path/librsb-1.3.0.2+dfsg' /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/i386-linux-gnu' - /bin/bash ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/i386-linux-gnu' + /bin/sh ./libtool --mode=install /usr/bin/install -c librsb.la '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/i386-linux-gnu' libtool: install: /usr/bin/install -c .libs/librsb.so.0.0.0 /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/i386-linux-gnu/librsb.so.0.0.0 libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/i386-linux-gnu && { ln -s -f librsb.so.0.0.0 librsb.so.0 || { rm -f librsb.so.0 && ln -s librsb.so.0.0.0 librsb.so.0; }; }) libtool: install: (cd /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/i386-linux-gnu && { ln -s -f librsb.so.0.0.0 librsb.so || { rm -f librsb.so && ln -s librsb.so.0.0.0 librsb.so; }; }) @@ -9574,7 +9723,7 @@ libtool: install: ranlib /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/lib/i386-linux-gnu/librsb.a libtool: warning: remember to run 'libtool --finish /usr/lib/i386-linux-gnu' /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' - /bin/bash ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' + /bin/sh ./libtool --mode=install /usr/bin/install -c rsbench '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' libtool: warning: 'librsb.la' has not been installed in '/usr/lib/i386-linux-gnu' libtool: install: /usr/bin/install -c .libs/rsbench /build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin/rsbench /usr/bin/mkdir -p '/build/reproducible-path/librsb-1.3.0.2+dfsg/debian/tmp/usr/bin' @@ -9701,12 +9850,12 @@ dh_gencontrol dh_md5sums dh_builddeb -dpkg-deb: building package 'librsb0t64' in '../librsb0t64_1.3.0.2+dfsg-7_i386.deb'. -dpkg-deb: building package 'librsb0t64-dbgsym' in '../librsb0t64-dbgsym_1.3.0.2+dfsg-7_i386.deb'. dpkg-deb: building package 'librsb-dev' in '../librsb-dev_1.3.0.2+dfsg-7_i386.deb'. dpkg-deb: building package 'librsb-tools-dbgsym' in '../librsb-tools-dbgsym_1.3.0.2+dfsg-7_i386.deb'. +dpkg-deb: building package 'librsb0t64' in '../librsb0t64_1.3.0.2+dfsg-7_i386.deb'. dpkg-deb: building package 'librsb-tools' in '../librsb-tools_1.3.0.2+dfsg-7_i386.deb'. dpkg-deb: building package 'librsb-doc' in '../librsb-doc_1.3.0.2+dfsg-7_all.deb'. +dpkg-deb: building package 'librsb0t64-dbgsym' in '../librsb0t64-dbgsym_1.3.0.2+dfsg-7_i386.deb'. dpkg-genbuildinfo --build=binary -O../librsb_1.3.0.2+dfsg-7_i386.buildinfo dpkg-genchanges --build=binary -O../librsb_1.3.0.2+dfsg-7_i386.changes dpkg-genchanges: info: binary-only upload (no source code included) @@ -9715,12 +9864,14 @@ dpkg-buildpackage: info: binary-only upload (no source included) dpkg-genchanges: info: not including original source code in upload I: copying local configuration +I: user script /srv/workspace/pbuilder/13949/tmp/hooks/B01_cleanup starting +I: user script /srv/workspace/pbuilder/13949/tmp/hooks/B01_cleanup finished I: unmounting dev/ptmx filesystem I: unmounting dev/pts filesystem I: unmounting dev/shm filesystem I: unmounting proc filesystem I: unmounting sys filesystem I: cleaning the build env -I: removing directory /srv/workspace/pbuilder/23139 and its subdirectories -I: Current time: Sun Jan 4 12:42:59 -12 2026 -I: pbuilder-time-stamp: 1767573779 +I: removing directory /srv/workspace/pbuilder/13949 and its subdirectories +I: Current time: Tue Dec 3 09:13:53 +14 2024 +I: pbuilder-time-stamp: 1733166833