[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
su: Authentication failure
[kaze@kaze ~]$ su
Password: 
[root@kaze kaze]# cd Quicksort_says_rev9
[root@kaze Quicksort_says_rev9]# ls -l
total 8339456
-rwxrwxrwx. 1 kaze kaze  178708944 Dec  4 22:54 22338618_QWORDS.bin
-rwxrwxrwx. 1 kaze kaze        913 Feb 21 03:29 bench_gcc.sh
-rwxrwxrwx. 1 kaze kaze        660 Feb 20 09:32 BENCH_ICL.BAT
-rwxrwxrwx. 1 kaze kaze        540 Feb 21 03:10 make_elf.sh
-rwxrwxrwx. 1 kaze kaze        346 Feb 21 01:41 MAKE_EXE.bat
-rwxrwxrwx. 1 kaze kaze 7798235442 Feb 18 14:51 math.stackexchange.com_en_all_2019-02.zim
-rwxrwxrwx. 1 kaze kaze   24823016 Dec  4 22:54 mobythesaurus.txt
-rwxrwxrwx. 1 kaze kaze     236647 Feb 21 03:46 QS_bench_r9.asm
-rwxrwxrwx. 1 kaze kaze     116646 Feb 21 03:46 QS_bench_r9.c
-rwxrwxrwx. 1 kaze kaze     367098 Feb 21 03:47 QS_bench_r9.cod
-rwxrwxrwx. 1 kaze kaze  268537344 Feb 21 03:47 QS_bench_r9_FULL-FLEDGED_ICL15.0.exe
-rwxrwxrwx. 1 kaze kaze  268536320 Feb 21 03:47 QS_bench_r9_ICL15.0.exe
[root@kaze Quicksort_says_rev9]# ls -l
total 14016044
-rwxrwxrwx. 1 kaze kaze  178708944 Dec  4 22:54 22338618_QWORDS.bin
-rwxrwxrwx. 1 kaze kaze        913 Feb 21 03:29 bench_gcc.sh
-rwxrwxrwx. 1 kaze kaze        660 Feb 20 09:32 BENCH_ICL.BAT
-rwxrwxrwx. 1 kaze kaze 3803483832 Nov 29 02:06 Fedora-Workstation-35-1.2.aarch64.raw.xz
-rwxrwxrwx. 1 kaze kaze 2009333760 Nov 28 23:21 Fedora-Workstation-Live-x86_64-35-1.2.iso
-rwxrwxrwx. 1 kaze kaze        540 Feb 21 03:10 make_elf.sh
-rwxrwxrwx. 1 kaze kaze        346 Feb 21 01:41 MAKE_EXE.bat
-rwxrwxrwx. 1 kaze kaze 7798235442 Feb 18 14:51 math.stackexchange.com_en_all_2019-02.zim
-rwxrwxrwx. 1 kaze kaze   24823016 Dec  4 22:54 mobythesaurus.txt
-rwxrwxrwx. 1 kaze kaze     236647 Feb 21 03:46 QS_bench_r9.asm
-rwxrwxrwx. 1 kaze kaze     116646 Feb 21 03:46 QS_bench_r9.c
-rwxrwxrwx. 1 kaze kaze     367098 Feb 21 03:47 QS_bench_r9.cod
-rwxrwxrwx. 1 kaze kaze  268537344 Feb 21 03:47 QS_bench_r9_FULL-FLEDGED_ICL15.0.exe
-rwxrwxrwx. 1 kaze kaze  268536320 Feb 21 03:47 QS_bench_r9_ICL15.0.exe
[root@kaze Quicksort_says_rev9]# sh make_elf.sh 
QS_bench_r9.c:1855:1: warning: return type defaults to ‘int’ [-Wimplicit-int]
 1855 | g(d,h){for(i=s;i<1<<25;i*=2)d=d*1LL*d%m;for(p=t;p<t+N;p+=s)for(i=s,c=1;i;i--)a=p[s]*(h?c:1LL)%m,p[s]=(m*1U+*p-a)*(h?1LL:c)%m,*p=(a*1U+*p)%m,p++,c=c*1LL*d%m;}
      | ^
QS_bench_r9.c: In function ‘g’:
QS_bench_r9.c:1855:1: warning: type of ‘d’ defaults to ‘int’ [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: type of ‘h’ defaults to ‘int’ [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: return type defaults to ‘int’ [-Wimplicit-int]
 1855 | g(d,h){for(i=s;i<1<<25;i*=2)d=d*1LL*d%m;for(p=t;p<t+N;p+=s)for(i=s,c=1;i;i--)a=p[s]*(h?c:1LL)%m,p[s]=(m*1U+*p-a)*(h?1LL:c)%m,*p=(a*1U+*p)%m,p++,c=c*1LL*d%m;}
      | ^
QS_bench_r9.c: In function ‘g’:
QS_bench_r9.c:1855:1: warning: type of ‘d’ defaults to ‘int’ [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: type of ‘h’ defaults to ‘int’ [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: return type defaults to ‘int’ [-Wimplicit-int]
 1855 | g(d,h){for(i=s;i<1<<25;i*=2)d=d*1LL*d%m;for(p=t;p<t+N;p+=s)for(i=s,c=1;i;i--)a=p[s]*(h?c:1LL)%m,p[s]=(m*1U+*p-a)*(h?1LL:c)%m,*p=(a*1U+*p)%m,p++,c=c*1LL*d%m;}
      | ^
QS_bench_r9.c: In function ‘g’:
QS_bench_r9.c:1855:1: warning: type of ‘d’ defaults to ‘int’ [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: type of ‘h’ defaults to ‘int’ [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: return type defaults to 'int' [-Wimplicit-int]
 1855 | g(d,h){for(i=s;i<1<<25;i*=2)d=d*1LL*d%m;for(p=t;p<t+N;p+=s)for(i=s,c=1;i;i--)a=p[s]*(h?c:1LL)%m,p[s]=(m*1U+*p-a)*(h?1LL:c)%m,*p=(a*1U+*p)%m,p++,c=c*1LL*d%m;}
      | ^
QS_bench_r9.c: In function 'g':
QS_bench_r9.c:1855:1: warning: type of 'd' defaults to 'int' [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: type of 'h' defaults to 'int' [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: return type defaults to 'int' [-Wimplicit-int]
 1855 | g(d,h){for(i=s;i<1<<25;i*=2)d=d*1LL*d%m;for(p=t;p<t+N;p+=s)for(i=s,c=1;i;i--)a=p[s]*(h?c:1LL)%m,p[s]=(m*1U+*p-a)*(h?1LL:c)%m,*p=(a*1U+*p)%m,p++,c=c*1LL*d%m;}
      | ^
QS_bench_r9.c: In function 'g':
QS_bench_r9.c:1855:1: warning: type of 'd' defaults to 'int' [-Wimplicit-int]
QS_bench_r9.c:1855:1: warning: type of 'h' defaults to 'int' [-Wimplicit-int]
[root@kaze Quicksort_says_rev9]# ls -l
total 15068332
-rwxrwxrwx. 1 kaze kaze  178708944 Dec  4 22:54 22338618_QWORDS.bin
-rwxrwxrwx. 1 kaze kaze        913 Feb 21 03:29 bench_gcc.sh
-rwxrwxrwx. 1 kaze kaze        660 Feb 20 09:32 BENCH_ICL.BAT
-rwxrwxrwx. 1 kaze kaze 3803483832 Nov 29 02:06 Fedora-Workstation-35-1.2.aarch64.raw.xz
-rwxrwxrwx. 1 kaze kaze 2009333760 Nov 28 23:21 Fedora-Workstation-Live-x86_64-35-1.2.iso
-rwxrwxrwx. 1 kaze kaze        540 Feb 21 03:10 make_elf.sh
-rwxrwxrwx. 1 kaze kaze        346 Feb 21 01:41 MAKE_EXE.bat
-rwxrwxrwx. 1 kaze kaze 7798235442 Feb 18 14:51 math.stackexchange.com_en_all_2019-02.zim
-rwxrwxrwx. 1 kaze kaze   24823016 Dec  4 22:54 mobythesaurus.txt
-rwxrwxrwx. 1 kaze kaze     236647 Feb 21 03:46 QS_bench_r9.asm
-rwxrwxrwx. 1 kaze kaze     116646 Feb 21 03:46 QS_bench_r9.c
-rwxrwxrwx. 1 kaze kaze     367098 Feb 21 03:47 QS_bench_r9.cod
-rw-r--r--. 1 root root      36303 Feb 21 03:59 QS_bench_r9.elf.asm
-rwxrwxrwx. 1 kaze kaze  268537344 Feb 21 03:47 QS_bench_r9_FULL-FLEDGED_ICL15.0.exe
-rwxr-xr-x. 1 root root  270200672 Feb 21 03:59 QS_bench_r9_GCC11.2.1.elf
-rwxr-xr-x. 1 root root  268544219 Feb 21 03:59 QS_bench_r9_GCC11.2.1.exe
-rwxr-xr-x. 1 root root  270200672 Feb 21 03:59 QS_bench_r9_GCC11.2.1_FULL-FLEDGED.elf
-rwxr-xr-x. 1 root root  268545243 Feb 21 03:59 QS_bench_r9_GCC11.2.1_FULL-FLEDGED.exe
-rwxrwxrwx. 1 kaze kaze  268536320 Feb 21 03:47 QS_bench_r9_ICL15.0.exe
[root@kaze Quicksort_says_rev9]# sh bench_gcc.sh 
Current priority is -20.
Allocating AUX-Buffer 21MB ...
Allocating Master-Buffer 17043MB ...
Sorting in single-thread 2233861800 elements...
Done in 387 seconds.
Checking whether sort went correct... OK. Unique keys = 10

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf qsort few':

        398,868.70 msec task-clock                #    1.000 CPUs utilized          
             5,058      context-switches          #   12.681 /sec                   
               227      cpu-migrations            #    0.569 /sec                   
         4,406,673      page-faults               #   11.048 K/sec                  
 1,228,567,163,670      cycles                    #    3.080 GHz                      (50.00%)
 3,299,909,622,205      instructions              #    2.69  insn per cycle           (62.50%)
   654,576,044,524      branches                  #    1.641 G/sec                    (62.50%)
     5,453,966,398      branch-misses             #    0.83% of all branches          (62.50%)
   739,433,220,718      L1-dcache-loads           #    1.854 G/sec                    (62.50%)
     7,280,725,752      L1-dcache-load-misses     #    0.98% of all L1-dcache accesses  (62.50%)
       470,898,267      LLC-loads                 #    1.181 M/sec                    (50.00%)
       106,497,784      LLC-load-misses           #   22.62% of all LL-cache accesses  (50.00%)

     398.973179810 seconds time elapsed

     391.225263000 seconds user
       5.177292000 seconds sys


Current priority is -20.
Allocating AUX-Buffer 21MB ...
Allocating Master-Buffer 17043MB ...
Sorting in single-thread 2233861800 elements...
Done in 34 seconds.
Checking whether sort went correct... OK. Unique keys = 10

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf Magnetica few':

         45,893.51 msec task-clock                #    0.997 CPUs utilized          
               918      context-switches          #   20.003 /sec                   
                64      cpu-migrations            #    1.395 /sec                   
         4,406,674      page-faults               #   96.020 K/sec                  
   141,246,946,749      cycles                    #    3.078 GHz                      (50.00%)
   128,971,506,074      instructions              #    0.91  insn per cycle           (62.50%)
    26,676,938,513      branches                  #  581.279 M/sec                    (62.50%)
     3,364,009,409      branch-misses             #   12.61% of all branches          (62.50%)
    18,312,121,596      L1-dcache-loads           #  399.013 M/sec                    (62.50%)
     2,085,581,382      L1-dcache-load-misses     #   11.39% of all L1-dcache accesses  (62.50%)
        85,006,612      LLC-loads                 #    1.852 M/sec                    (50.00%)
        52,711,137      LLC-load-misses           #   62.01% of all LL-cache accesses  (50.00%)

      46.048990604 seconds time elapsed

      40.278121000 seconds user
       5.290894000 seconds sys


Current priority is -20.
Allocating AUX-Buffer 21MB ...
Allocating Master-Buffer 17043MB ...
Sorting in single-thread 2233861800 elements...
Done in 40 seconds.
Checking whether sort went correct... OK. Unique keys = 10

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf BM few':

         52,318.65 msec task-clock                #    1.000 CPUs utilized          
               628      context-switches          #   12.003 /sec                   
                29      cpu-migrations            #    0.554 /sec                   
         4,406,674      page-faults               #   84.228 K/sec                  
   161,066,248,831      cycles                    #    3.079 GHz                      (50.00%)
   160,045,020,378      instructions              #    0.99  insn per cycle           (62.50%)
    32,683,776,458      branches                  #  624.706 M/sec                    (62.50%)
     2,986,175,515      branch-misses             #    9.14% of all branches          (62.50%)
    25,552,391,720      L1-dcache-loads           #  488.399 M/sec                    (62.50%)
     2,665,188,526      L1-dcache-load-misses     #   10.43% of all L1-dcache accesses  (62.50%)
       255,843,507      LLC-loads                 #    4.890 M/sec                    (50.00%)
       108,606,963      LLC-load-misses           #   42.45% of all LL-cache accesses  (50.00%)

      52.338686724 seconds time elapsed

      46.831579000 seconds user
       5.122231000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 23MB ...
Allocating AUX-Buffer 189MB ...
Allocating Master-Buffer 18938MB ...
Sorting in single-thread 2482300900 elements...
Done in 553 seconds.
Checking whether sort went correct... OK. Unique keys = 2847531

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf qsort many':

        565,682.86 msec task-clock                #    1.000 CPUs utilized          
             6,699      context-switches          #   11.842 /sec                   
               287      cpu-migrations            #    0.507 /sec                   
         4,902,819      page-faults               #    8.667 K/sec                  
 1,742,032,470,480      cycles                    #    3.080 GHz                      (50.00%)
 2,960,957,010,479      instructions              #    1.70  insn per cycle           (62.50%)
   661,325,741,342      branches                  #    1.169 G/sec                    (62.50%)
    24,471,940,736      branch-misses             #    3.70% of all branches          (62.50%)
   681,446,613,554      L1-dcache-loads           #    1.205 G/sec                    (62.50%)
     8,991,420,940      L1-dcache-load-misses     #    1.32% of all L1-dcache accesses  (62.50%)
       324,839,902      LLC-loads                 #  574.244 K/sec                    (50.00%)
       125,398,893      LLC-load-misses           #   38.60% of all LL-cache accesses  (50.00%)

     565.826953669 seconds time elapsed

     556.258357000 seconds user
       5.866774000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 23MB ...
Allocating AUX-Buffer 189MB ...
Allocating Master-Buffer 18938MB ...
Sorting in single-thread 2482300900 elements...
Done in 218 seconds.
Checking whether sort went correct... OK. Unique keys = 2847531

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf Magnetica many':

        231,491.89 msec task-clock                #    1.000 CPUs utilized          
             3,427      context-switches          #   14.804 /sec                   
               155      cpu-migrations            #    0.670 /sec                   
         4,902,820      page-faults               #   21.179 K/sec                  
   712,450,258,071      cycles                    #    3.078 GHz                      (50.00%)
   801,735,343,248      instructions              #    1.13  insn per cycle           (62.50%)
   146,404,311,920      branches                  #  632.438 M/sec                    (62.50%)
    19,425,844,842      branch-misses             #   13.27% of all branches          (62.50%)
   110,872,620,276      L1-dcache-loads           #  478.948 M/sec                    (62.50%)
    10,284,451,506      L1-dcache-load-misses     #    9.28% of all L1-dcache accesses  (62.50%)
       372,008,878      LLC-loads                 #    1.607 M/sec                    (50.00%)
       246,471,537      LLC-load-misses           #   66.25% of all LL-cache accesses  (50.00%)

     231.567481893 seconds time elapsed

     224.145665000 seconds user
       5.675128000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 23MB ...
Allocating AUX-Buffer 189MB ...
Allocating Master-Buffer 18938MB ...
Sorting in single-thread 2482300900 elements...
Done in 219 seconds.
Checking whether sort went correct... OK. Unique keys = 2847531

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf BM many':

        233,167.45 msec task-clock                #    1.000 CPUs utilized          
             3,005      context-switches          #   12.888 /sec                   
               124      cpu-migrations            #    0.532 /sec                   
         4,902,819      page-faults               #   21.027 K/sec                  
   717,744,265,825      cycles                    #    3.078 GHz                      (50.00%)
   677,549,425,659      instructions              #    0.94  insn per cycle           (62.50%)
   170,121,823,699      branches                  #  729.612 M/sec                    (62.50%)
    18,987,127,843      branch-misses             #   11.16% of all branches          (62.50%)
    90,776,749,587      L1-dcache-loads           #  389.320 M/sec                    (62.50%)
     9,127,736,810      L1-dcache-load-misses     #   10.06% of all L1-dcache accesses  (62.50%)
       323,207,909      LLC-loads                 #    1.386 M/sec                    (50.00%)
       209,837,992      LLC-load-misses           #   64.92% of all LL-cache accesses  (50.00%)

     233.215635718 seconds time elapsed

     225.826429000 seconds user
       5.726386000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 1916MB ...
Allocating AUX-Buffer 15329MB ...
Allocating Master-Buffer 15329MB ...
Sorting in single-thread 2009333753 elements...
Done in 529 seconds.
Checking whether sort went correct... OK. Unique keys = 1912608132

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf qsort ALL':

        548,149.35 msec task-clock                #    0.995 CPUs utilized          
             8,924      context-switches          #   16.280 /sec                   
               385      cpu-migrations            #    0.702 /sec                   
         8,339,552      page-faults               #   15.214 K/sec                  
 1,687,931,155,049      cycles                    #    3.079 GHz                      (50.00%)
 2,310,758,624,147      instructions              #    1.37  insn per cycle           (62.50%)
   544,818,402,494      branches                  #  993.923 M/sec                    (62.50%)
    27,901,159,413      branch-misses             #    5.12% of all branches          (62.50%)
   530,533,327,691      L1-dcache-loads           #  967.863 M/sec                    (62.50%)
     7,599,385,131      L1-dcache-load-misses     #    1.43% of all L1-dcache accesses  (62.50%)
       290,100,866      LLC-loads                 #  529.237 K/sec                    (50.00%)
       111,744,974      LLC-load-misses           #   38.52% of all LL-cache accesses  (50.00%)

     551.082490803 seconds time elapsed

     534.418502000 seconds user
      10.321482000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 1916MB ...
Allocating AUX-Buffer 15329MB ...
Allocating Master-Buffer 15329MB ...
Sorting in single-thread 2009333753 elements...
Done in 289 seconds.
Checking whether sort went correct... OK. Unique keys = 1912608132

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf Magnetica ALL':

        309,001.17 msec task-clock                #    0.995 CPUs utilized          
             5,400      context-switches          #   17.476 /sec                   
               189      cpu-migrations            #    0.612 /sec                   
         8,339,552      page-faults               #   26.989 K/sec                  
   950,987,842,682      cycles                    #    3.078 GHz                      (50.00%)
 1,101,560,754,831      instructions              #    1.16  insn per cycle           (62.51%)
   198,371,951,051      branches                  #  641.978 M/sec                    (62.50%)
    25,938,277,968      branch-misses             #   13.08% of all branches          (62.50%)
   156,092,140,810      L1-dcache-loads           #  505.151 M/sec                    (62.50%)
     8,391,760,016      L1-dcache-load-misses     #    5.38% of all L1-dcache accesses  (62.50%)
       316,532,523      LLC-loads                 #    1.024 M/sec                    (50.00%)
       195,952,211      LLC-load-misses           #   61.91% of all LL-cache accesses  (50.00%)

     310.623513195 seconds time elapsed

     295.656723000 seconds user
      11.191107000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 1916MB ...
Allocating AUX-Buffer 15329MB ...
Allocating Master-Buffer 15329MB ...
Sorting in single-thread 2009333753 elements...
Done in 295 seconds.
Checking whether sort went correct... OK. Unique keys = 1912608132

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf BM ALL':

        314,513.62 msec task-clock                #    0.997 CPUs utilized          
             6,503      context-switches          #   20.676 /sec                   
               223      cpu-migrations            #    0.709 /sec                   
         8,339,552      page-faults               #   26.516 K/sec                  
   968,105,796,590      cycles                    #    3.078 GHz                      (50.00%)
   943,804,081,222      instructions              #    0.97  insn per cycle           (62.50%)
   235,651,132,345      branches                  #  749.256 M/sec                    (62.50%)
    26,272,026,192      branch-misses             #   11.15% of all branches          (62.50%)
   131,672,729,927      L1-dcache-loads           #  418.655 M/sec                    (62.50%)
     8,898,471,801      L1-dcache-load-misses     #    6.76% of all L1-dcache accesses  (62.50%)
       331,556,335      LLC-loads                 #    1.054 M/sec                    (50.00%)
       217,277,816      LLC-load-misses           #   65.53% of all LL-cache accesses  (50.00%)

     315.420184260 seconds time elapsed

     301.474871000 seconds user
      10.907281000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 3627MB ...
Allocating Master-Buffer 29018MB ...
Sorting in single-thread 3803483825 elements...
Done in 1034 seconds.
Checking whether sort went correct... OK. Unique keys = 3346259533

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf qsort ALLmore':

      1,054,089.24 msec task-clock                #    0.995 CPUs utilized          
            16,227      context-switches          #   15.394 /sec                   
               744      cpu-migrations            #    0.706 /sec                   
         8,357,296      page-faults               #    7.928 K/sec                  
 3,245,946,026,588      cycles                    #    3.079 GHz                      (50.00%)
 4,454,801,921,967      instructions              #    1.37  insn per cycle           (62.50%)
 1,053,786,522,487      branches                  #  999.713 M/sec                    (62.50%)
    54,858,612,776      branch-misses             #    5.21% of all branches          (62.50%)
 1,021,681,499,395      L1-dcache-loads           #  969.255 M/sec                    (62.50%)
    14,019,750,515      L1-dcache-load-misses     #    1.37% of all L1-dcache accesses  (62.50%)
       524,744,956      LLC-loads                 #  497.818 K/sec                    (50.00%)
       212,088,395      LLC-load-misses           #   40.42% of all LL-cache accesses  (50.00%)

    1059.509369408 seconds time elapsed

    1036.844914000 seconds user
      10.573884000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 3627MB ...
Allocating Master-Buffer 29018MB ...
Sorting in single-thread 3803483825 elements...
Done in 571 seconds.
Checking whether sort went correct... OK. Unique keys = 3346259533

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf Magnetica ALLmore':

        594,187.41 msec task-clock                #    0.995 CPUs utilized          
            17,188      context-switches          #   28.927 /sec                   
               364      cpu-migrations            #    0.613 /sec                   
         8,357,300      page-faults               #   14.065 K/sec                  
 1,828,594,647,771      cycles                    #    3.077 GHz                      (50.00%)
 2,090,685,294,825      instructions              #    1.14  insn per cycle           (62.50%)
   377,739,579,362      branches                  #  635.725 M/sec                    (62.50%)
    51,739,059,233      branch-misses             #   13.70% of all branches          (62.50%)
   291,467,597,289      L1-dcache-loads           #  490.531 M/sec                    (62.50%)
    15,485,690,648      L1-dcache-load-misses     #    5.31% of all L1-dcache accesses  (62.50%)
       625,446,260      LLC-loads                 #    1.053 M/sec                    (50.00%)
       398,274,891      LLC-load-misses           #   63.68% of all LL-cache accesses  (50.00%)

     597.171367494 seconds time elapsed

     577.352877000 seconds user
      12.736028000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 3627MB ...
Allocating Master-Buffer 29018MB ...
Sorting in single-thread 3803483825 elements...
Done in 580 seconds.
Checking whether sort went correct... OK. Unique keys = 3346259533

 Performance counter stats for './QS_bench_r9_GCC11.2.1.elf BM ALLmore':

        602,669.22 msec task-clock                #    0.997 CPUs utilized          
            16,388      context-switches          #   27.192 /sec                   
               468      cpu-migrations            #    0.777 /sec                   
         8,357,299      page-faults               #   13.867 K/sec                  
 1,855,042,047,638      cycles                    #    3.078 GHz                      (50.00%)
 1,718,762,658,492      instructions              #    0.93  insn per cycle           (62.50%)
   434,858,208,781      branches                  #  721.554 M/sec                    (62.50%)
    52,585,329,173      branch-misses             #   12.09% of all branches          (62.50%)
   236,875,195,511      L1-dcache-loads           #  393.043 M/sec                    (62.50%)
    15,080,486,778      L1-dcache-load-misses     #    6.37% of all L1-dcache accesses  (62.50%)
       524,725,096      LLC-loads                 #  870.668 K/sec                    (50.00%)
       329,238,240      LLC-load-misses           #   62.74% of all LL-cache accesses  (50.00%)

     604.273296267 seconds time elapsed

     586.086563000 seconds user
      12.421722000 seconds sys


Current priority is -20.
Allocating AUX-Buffer 21MB ...
Allocating Master-Buffer 17043MB ...
Sorting in single-thread 2233861800 elements...
Done in 39 seconds.
Checking whether sort went correct... OK. Unique keys = 10

 Performance counter stats for './QS_bench_r9_GCC11.2.1_FULL-FLEDGED.elf Magnetica few':

         51,453.88 msec task-clock                #    0.995 CPUs utilized          
               640      context-switches          #   12.438 /sec                   
                46      cpu-migrations            #    0.894 /sec                   
         4,406,678      page-faults               #   85.643 K/sec                  
   158,348,979,809      cycles                    #    3.077 GHz                      (50.00%)
   156,942,283,417      instructions              #    0.99  insn per cycle           (62.51%)
    33,089,010,344      branches                  #  643.081 M/sec                    (62.50%)
     3,187,015,393      branch-misses             #    9.63% of all branches          (62.50%)
    20,337,411,081      L1-dcache-loads           #  395.255 M/sec                    (62.50%)
     2,352,364,606      L1-dcache-load-misses     #   11.57% of all L1-dcache accesses  (62.50%)
        92,071,416      LLC-loads                 #    1.789 M/sec                    (50.01%)
        59,417,604      LLC-load-misses           #   64.53% of all LL-cache accesses  (50.00%)

      51.717105666 seconds time elapsed

      45.850627000 seconds user
       5.229383000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 23MB ...
Allocating AUX-Buffer 189MB ...
Allocating Master-Buffer 18938MB ...
Sorting in single-thread 2482300900 elements...
Done in 240 seconds.
Checking whether sort went correct... OK. Unique keys = 2847531

 Performance counter stats for './QS_bench_r9_GCC11.2.1_FULL-FLEDGED.elf Magnetica many':

        253,173.76 msec task-clock                #    1.000 CPUs utilized          
             3,009      context-switches          #   11.885 /sec                   
               154      cpu-migrations            #    0.608 /sec                   
         4,902,819      page-faults               #   19.365 K/sec                  
   779,130,836,909      cycles                    #    3.077 GHz                      (50.00%)
   754,524,996,392      instructions              #    0.97  insn per cycle           (62.50%)
   142,429,883,242      branches                  #  562.578 M/sec                    (62.50%)
    20,412,452,397      branch-misses             #   14.33% of all branches          (62.50%)
   100,777,844,119      L1-dcache-loads           #  398.058 M/sec                    (62.50%)
     9,156,532,285      L1-dcache-load-misses     #    9.09% of all L1-dcache accesses  (62.50%)
       275,003,541      LLC-loads                 #    1.086 M/sec                    (50.00%)
       177,804,860      LLC-load-misses           #   64.66% of all LL-cache accesses  (50.00%)

     253.279919479 seconds time elapsed

     245.520299000 seconds user
       5.812543000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 1916MB ...
Allocating AUX-Buffer 15329MB ...
Allocating Master-Buffer 15329MB ...
Sorting in single-thread 2009333753 elements...
Done in 343 seconds.
Checking whether sort went correct... OK. Unique keys = 1912608132

 Performance counter stats for './QS_bench_r9_GCC11.2.1_FULL-FLEDGED.elf Magnetica ALL':

        363,525.94 msec task-clock                #    0.995 CPUs utilized          
             6,244      context-switches          #   17.176 /sec                   
               231      cpu-migrations            #    0.635 /sec                   
         8,339,552      page-faults               #   22.941 K/sec                  
 1,119,007,433,266      cycles                    #    3.078 GHz                      (49.99%)
 1,010,978,690,855      instructions              #    0.90  insn per cycle           (62.50%)
   185,866,726,715      branches                  #  511.289 M/sec                    (62.50%)
    24,737,797,715      branch-misses             #   13.31% of all branches          (62.50%)
   136,113,195,244      L1-dcache-loads           #  374.425 M/sec                    (62.51%)
     7,749,501,336      L1-dcache-load-misses     #    5.69% of all L1-dcache accesses  (62.50%)
       283,434,747      LLC-loads                 #  779.682 K/sec                    (50.00%)
       163,877,415      LLC-load-misses           #   57.82% of all LL-cache accesses  (50.00%)

     365.349526755 seconds time elapsed

     349.899219000 seconds user
      11.188385000 seconds sys


Current priority is -20.
Allocating FILE-Buffer 3627MB ...
Allocating Master-Buffer 29018MB ...
Sorting in single-thread 3803483825 elements...
Done in 673 seconds.
Checking whether sort went correct... OK. Unique keys = 3346259533

 Performance counter stats for './QS_bench_r9_GCC11.2.1_FULL-FLEDGED.elf Magnetica ALLmore':

        696,470.98 msec task-clock                #    0.998 CPUs utilized          
            24,679      context-switches          #   35.434 /sec                   
               479      cpu-migrations            #    0.688 /sec                   
         8,357,297      page-faults               #   11.999 K/sec                  
 2,143,805,148,859      cycles                    #    3.078 GHz                      (50.00%)
 1,937,390,447,511      instructions              #    0.90  insn per cycle           (62.50%)
   355,706,833,623      branches                  #  510.727 M/sec                    (62.50%)
    48,912,894,176      branch-misses             #   13.75% of all branches          (62.50%)
   255,278,204,148      L1-dcache-loads           #  366.531 M/sec                    (62.50%)
    13,863,216,926      L1-dcache-load-misses     #    5.43% of all L1-dcache accesses  (62.50%)
       505,908,745      LLC-loads                 #  726.389 K/sec                    (50.00%)
       288,670,201      LLC-load-misses           #   57.06% of all LL-cache accesses  (50.00%)

     698.215491695 seconds time elapsed

     678.975957000 seconds user
      12.666116000 seconds sys


[root@kaze Quicksort_says_rev9]# gcc --version
gcc (GCC) 11.2.1 20211203 (Red Hat 11.2.1-7)
Copyright (C) 2021 Free Software Foundation, Inc.
This is free software; see the source for copying conditions.  There is NO
warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.

[root@kaze Quicksort_says_rev9]# 

