Test results for amd64, hunsnivy, crypto_sort/int64

[Page version: 20260324 03:36:53]

Measurements for amd64, hunsnivy, crypto_sort | Test results for amd64, hunsnivy, crypto_sort | Test results for crypto_sort/int64

Computer: hunsnivy
Microarchitecture: amd64; Ivy Bridge+AES (306a9)
Architecture: amd64
CPU ID: GenuineIntel-000306a9-bfebfbff
SUPERCOP version: 20260217
Operation: crypto_sort
Primitive: int64

Time	Object size	Test size	Implementation	Compiler	Benchmark date	SUPERCOP version
43629	36387 0 0	58087 1200 1536	`sse42`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
43926	35461 0 0	55663 1200 1536	`sse42`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
44852	34720 0 0	54294 1192 1536	`sse42`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
45441	35484 0 0	57568 1272 1472	`sse42`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
45443	34676 0 0	54240 1272 1472	`sse42`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
45471	35484 0 0	56648 1272 1472	`sse42`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
45658	34761 0 0	53654 1264 1472	`sse42`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
46026	38147 0 0	56610 1176 1504	`sse42`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
66656	8807 0 0	27790 1264 1472	`x863`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
66666	11704 0 0	33904 1272 1472	`x863`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
66666	11689 0 0	33744 1272 1472	`x863`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
66996	10056 0 0	31336 1272 1472	`x863`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
68564	9690 0 0	29368 1272 1472	`x863`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
68693	11348 0 0	32863 1200 1536	`x863`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
68716	10445 0 0	29822 1192 1536	`x863`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
70956	11110 0 0	31127 1200 1536	`x863`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
71739	917 0 0	23120 1272 1472	`portable4`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
72930	676 0 0	19670 1264 1472	`portable4`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
73908	837 0 0	22120 1272 1472	`portable4`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
76218	918 0 0	22976 1272 1472	`portable4`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
76618	837 0 0	20536 1272 1472	`portable4`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
78548	3915 0 0	22178 1176 1504	`x863`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
79133	865 0 0	20879 1200 1536	`portable4`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
79431	865 0 0	22375 1200 1536	`portable4`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
80534	1349 0 0	24685 1288 1568	`T:stdsort`	`g++ -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
80650	1297 0 0	23180 1296 1568	`T:stdsort`	`g++ -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
81282	1334 0 0	21825 1352 1472	`T:stdsort`	`clang++ -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
81474	1762 0 0	25076 1352 1472	`T:stdsort`	`clang++ -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
81805	1523 0 0	24000 1352 1472	`T:stdsort`	`clang++ -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
82978	1591 0 0	22547 1360 1472	`T:stdsort`	`clang++ -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
88363	1173 0 0	22355 1288 1568	`T:stdsort`	`g++ -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
93366	928 0 0	20867 1272 1536	`T:stdsort`	`g++ -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
109243	957 0 0	20342 1192 1536	`portable4`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
165006	664 0 0	18930 1176 1504	`portable4`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217

Compiler output

sort.c: sort.c:127:11: error: always_inline function '_mm256_sub_epi32' requires target feature 'avx2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx2'
sort.c:   diff2 = int32x8_sub(int32x8_set(16,17,18,19,20,21,22,23),int32x8_broadcast(2*pos2));
sort.c:           ^
sort.c: sort.c:36:21: note: expanded from macro 'int32x8_sub'
sort.c: #define int32x8_sub _mm256_sub_epi32
sort.c:                     ^
sort.c: sort.c:128:36: error: always_inline function '_mm256_permutevar8x32_epi32' requires target feature 'avx2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx2'
sort.c:   x2 = int8x32_iftopthenelse(diff2,int32x8_varextract(int64x4_load(x+pos2-4),diff2),infty); // 2 6 10 14
sort.c:                                    ^
sort.c: sort.c:39:28: note: expanded from macro 'int32x8_varextract'
sort.c: #define int32x8_varextract _mm256_permutevar8x32_epi32
sort.c:                            ^
sort.c: sort.c:128:8: error: always_inline function '_mm256_blendv_epi8' requires target feature 'avx2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx2'
sort.c:   x2 = int8x32_iftopthenelse(diff2,int32x8_varextract(int64x4_load(x+pos2-4),diff2),infty); // 2 6 10 14
sort.c:        ^
sort.c: sort.c:23:38: note: expanded from macro 'int8x32_iftopthenelse'
sort.c: #define int8x32_iftopthenelse(c,t,e) _mm256_blendv_epi8(e,t,c)
sort.c:                                      ^
sort.c: sort.c:130:11: error: always_inline function '_mm256_sub_epi32' requires target feature 'avx2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx2'
sort.c:   diff3 = int32x8_sub(int32x8_set(24,25,26,27,28,29,30,31),int32x8_broadcast(2*pos3));
sort.c:           ^
sort.c: sort.c:36:21: note: expanded from macro 'int32x8_sub'
sort.c: #define int32x8_sub _mm256_sub_epi32
sort.c:                     ^
sort.c: sort.c:131:36: error: always_inline function '_mm256_permutevar8x32_epi32' requires target feature 'avx2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx2'
sort.c: ...

Number of similar (implementation,compiler) pairs: 4, namely:

Implementation	Compiler
`2026avx2`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`2026avx2`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`2026avx2`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`2026avx2`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`

Compiler output

sort.c: sort.c:123:8: error: always_inline function '_mm256_loadu_si256' requires target feature 'avx', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx'
sort.c:   x0 = int64x4_load(x+0); // 0 4 8 12
sort.c:        ^
sort.c: sort.c:17:25: note: expanded from macro 'int64x4_load'
sort.c: #define int64x4_load(z) _mm256_loadu_si256((__m256i *) (z))
sort.c:                         ^
sort.c: sort.c:123:8: error: AVX vector return of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
sort.c: sort.c:17:25: note: expanded from macro 'int64x4_load'
sort.c: #define int64x4_load(z) _mm256_loadu_si256((__m256i *) (z))
sort.c:                         ^
sort.c: sort.c:124:8: error: always_inline function '_mm256_loadu_si256' requires target feature 'avx', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx'
sort.c:   x1 = int64x4_load(x+4); // 1 5 9 13
sort.c:        ^
sort.c: sort.c:17:25: note: expanded from macro 'int64x4_load'
sort.c: #define int64x4_load(z) _mm256_loadu_si256((__m256i *) (z))
sort.c:                         ^
sort.c: sort.c:124:8: error: AVX vector return of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
sort.c: sort.c:17:25: note: expanded from macro 'int64x4_load'
sort.c: #define int64x4_load(z) _mm256_loadu_si256((__m256i *) (z))
sort.c:                         ^
sort.c: sort.c:125:11: error: always_inline function '_mm256_set1_epi64x' requires target feature 'avx', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx'
sort.c:   infty = int64x4_broadcast(int64_largest);
sort.c:           ^
sort.c: sort.c:41:27: note: expanded from macro 'int64x4_broadcast'
sort.c: #define int64x4_broadcast _mm256_set1_epi64x
sort.c: ...

Number of similar (implementation,compiler) pairs: 1, namely:

Implementation	Compiler
`2026avx2`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`

Compiler output

sort.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/12/include/immintrin.h:47,
sort.c:                  from sort.c:4:
sort.c: /usr/lib/gcc/x86_64-linux-gnu/12/include/avx2intrin.h: In function 'int64_sort_8through16':
sort.c: /usr/lib/gcc/x86_64-linux-gnu/12/include/avx2intrin.h:1044:1: error: inlining failed in call to 'always_inline' '_mm256_permutevar8x32_epi32': target specific option mismatch
sort.c:  1044 | _mm256_permutevar8x32_epi32 (__m256i __X, __m256i __Y)
sort.c:       | ^~~~~~~~~~~~~~~~~~~~~~~~~~~
sort.c: sort.c:18:28: note: called from here
sort.c:    18 | #define int64x4_store(z,i) _mm256_storeu_si256((__m256i *) (z),(i))
sort.c:       |                            ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
sort.c: sort.c:222:3: note: in expansion of macro 'int64x4_store'
sort.c:   222 |   int64x4_store(x+pos2-4,int32x8_varextract(x3,int32x8_add(int32x8_set(0,1,2,3,4,5,6,7),int32x8_broadcast(2*pos2))));
sort.c:       |   ^~~~~~~~~~~~~
sort.c: /usr/lib/gcc/x86_64-linux-gnu/12/include/avx2intrin.h:119:1: error: inlining failed in call to 'always_inline' '_mm256_add_epi32': target specific option mismatch
sort.c:   119 | _mm256_add_epi32 (__m256i __A, __m256i __B)
sort.c:       | ^~~~~~~~~~~~~~~~
sort.c: sort.c:18:28: note: called from here
sort.c:    18 | #define int64x4_store(z,i) _mm256_storeu_si256((__m256i *) (z),(i))
sort.c:       |                            ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
sort.c: sort.c:222:3: note: in expansion of macro 'int64x4_store'
sort.c:   222 |   int64x4_store(x+pos2-4,int32x8_varextract(x3,int32x8_add(int32x8_set(0,1,2,3,4,5,6,7),int32x8_broadcast(2*pos2))));
sort.c:       |   ^~~~~~~~~~~~~
sort.c: /usr/lib/gcc/x86_64-linux-gnu/12/include/avx2intrin.h:1044:1: error: inlining failed in call to 'always_inline' '_mm256_permutevar8x32_epi32': target specific option mismatch
sort.c:  1044 | _mm256_permutevar8x32_epi32 (__m256i __X, __m256i __Y)
sort.c:       | ^~~~~~~~~~~~~~~~~~~~~~~~~~~
sort.c: sort.c:18:28: note: called from here
sort.c: ...

Number of similar (implementation,compiler) pairs: 4, namely:

Implementation	Compiler
`2026avx2`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`2026avx2`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`2026avx2`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`2026avx2`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`

Compiler output

sort.c: sort.c:130:93: error: always_inline function '_mm_shuffle_epi8' requires target feature 'ssse3', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'ssse3'
sort.c:   x4 = int8x16_iftopthenelse(int64x2_smaller_mask(int64x2_set(8,9),int64x2_broadcast(pos4)),int8x16_varextract(int64x2_load(x+pos4-2),int8x16_sub(int8x16_set(16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31),int8x16_broadcast(8*(pos4&1)))),infty); // 4 12
sort.c:                                                                                             ^
sort.c: sort.c:39:28: note: expanded from macro 'int8x16_varextract'
sort.c: #define int8x16_varextract _mm_shuffle_epi8
sort.c:                            ^
sort.c: sort.c:130:30: error: always_inline function '_mm_cmpgt_epi64' requires target feature 'sse4.2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'sse4.2'
sort.c:   x4 = int8x16_iftopthenelse(int64x2_smaller_mask(int64x2_set(8,9),int64x2_broadcast(pos4)),int8x16_varextract(int64x2_load(x+pos4-2),int8x16_sub(int8x16_set(16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31),int8x16_broadcast(8*(pos4&1)))),infty); // 4 12
sort.c:                              ^
sort.c: sort.c:20:35: note: expanded from macro 'int64x2_smaller_mask'
sort.c: #define int64x2_smaller_mask(a,b) _mm_cmpgt_epi64(b,a)
sort.c:                                   ^
sort.c: sort.c:130:8: error: always_inline function '_mm_blendv_epi8' requires target feature 'sse4.1', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'sse4.1'
sort.c:   x4 = int8x16_iftopthenelse(int64x2_smaller_mask(int64x2_set(8,9),int64x2_broadcast(pos4)),int8x16_varextract(int64x2_load(x+pos4-2),int8x16_sub(int8x16_set(16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31),int8x16_broadcast(8*(pos4&1)))),infty); // 4 12
sort.c:        ^
sort.c: sort.c:23:38: note: expanded from macro 'int8x16_iftopthenelse'
sort.c: #define int8x16_iftopthenelse(c,t,e) _mm_blendv_epi8(e,t,c)
sort.c:                                      ^
sort.c: sort.c:132:95: error: always_inline function '_mm_shuffle_epi8' requires target feature 'ssse3', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'ssse3'
sort.c:   x5 = int8x16_iftopthenelse(int64x2_smaller_mask(int64x2_set(10,11),int64x2_broadcast(pos5)),int8x16_varextract(int64x2_load(x+pos5-2),int8x16_sub(int8x16_set(16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31),int8x16_broadcast(8*(pos5&1)))),infty); // 5 13
sort.c:                                                                                               ^
sort.c: sort.c:39:28: note: expanded from macro 'int8x16_varextract'
sort.c: #define int8x16_varextract _mm_shuffle_epi8
sort.c:                            ^
sort.c: sort.c:132:30: error: always_inline function '_mm_cmpgt_epi64' requires target feature 'sse4.2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'sse4.2'
sort.c: ...

Number of similar (implementation,compiler) pairs: 1, namely:

Implementation	Compiler
`sse42`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`

Passed TIMECOP

TIMECOP iterations: 10

Number of similar (implementation,compiler) pairs: 26, namely:

Implementation	Compiler
`portable4`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`portable4`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`portable4`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`portable4`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`sse42`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`sse42`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`sse42`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`sse42`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`sse42`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`sse42`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`sse42`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`sse42`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`x863`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`x863`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`x863`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`x863`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`