Test results for amd64, speed2supercop, crypto_aead/aezv3
[Page version: 20241023 21:37:24]
Measurements for amd64, speed2supercop, crypto_aead
Test results for amd64, speed2supercop, crypto_aead
Test results for crypto_aead/aezv3
Computer: speed2supercop
Microarchitecture: amd64; Haswell+AES (306c3)
Architecture: amd64
CPU ID: GenuineIntel-000306c3-1fc9cbf5
SUPERCOP version: 20241022
Operation: crypto_aead
Primitive: aezv3
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version |
3740 | 8335 0 0 | 26496 728 896 | T:aesni | gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
3744 | 9787 0 0 | 29997 752 928 | T:aesni | gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
3752 | 16745 0 0 | 38941 752 928 | T:aesni | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
3772 | 10942 0 0 | 34126 792 872 | T:aesni | clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
3776 | 10910 0 0 | 33902 792 872 | T:aesni | clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
3824 | 10629 0 0 | 29558 792 856 | T:aesni | clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
3824 | 9638 0 0 | 29695 784 920 | T:aesni | clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
3864 | 10222 0 0 | 29964 744 928 | T:aesni | gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
750180 | 33214 0 0 | 55422 808 856 | T:ref | clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
781148 | 32467 0 0 | 56134 808 872 | T:ref | clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
784240 | 30796 0 0 | 54254 808 872 | T:ref | clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
968768 | 24674 0 0 | 45085 768 928 | T:ref | gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
976804 | 52136 0 0 | 74589 768 928 | T:ref | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
1151480 | 23763 0 0 | 43174 808 856 | T:ref | clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
1210712 | 24948 0 0 | 44917 768 928 | T:ref | gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
1225520 | 22234 0 0 | 42583 800 920 | T:ref | clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
1415176 | 21926 0 0 | 40232 744 896 | T:ref | gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20240703 | 20240625 |
Compiler output
aez_ni.c: aez_ni.c:146:22: error: '__builtin_ia32_vec_set_v16qi' needs target feature sse4.1
aez_ni.c: __m128i i1 = _mm_insert_epi8(zero, 1, 7);
aez_ni.c: ^
aez_ni.c: /usr/lib/llvm-16/lib/clang/16/include/smmintrin.h:923:13: note: expanded from macro '_mm_insert_epi8'
aez_ni.c: ((__m128i)__builtin_ia32_vec_set_v16qi((__v16qi)(__m128i)(X), (int)(I), \
aez_ni.c: ^
aez_ni.c: aez_ni.c:147:22: error: '__builtin_ia32_vec_set_v16qi' needs target feature sse4.1
aez_ni.c: __m128i i2 = _mm_insert_epi8(zero, 2, 7);
aez_ni.c: ^
aez_ni.c: /usr/lib/llvm-16/lib/clang/16/include/smmintrin.h:923:13: note: expanded from macro '_mm_insert_epi8'
aez_ni.c: ((__m128i)__builtin_ia32_vec_set_v16qi((__v16qi)(__m128i)(X), (int)(I), \
aez_ni.c: ^
aez_ni.c: aez_ni.c:148:22: error: '__builtin_ia32_vec_set_v16qi' needs target feature sse4.1
aez_ni.c: __m128i i3 = _mm_insert_epi8(zero, 3, 7);
aez_ni.c: ^
aez_ni.c: /usr/lib/llvm-16/lib/clang/16/include/smmintrin.h:923:13: note: expanded from macro '_mm_insert_epi8'
aez_ni.c: ((__m128i)__builtin_ia32_vec_set_v16qi((__v16qi)(__m128i)(X), (int)(I), \
aez_ni.c: ^
aez_ni.c: aez_ni.c:149:26: error: '__builtin_ia32_vec_set_v16qi' needs target feature sse4.1
aez_ni.c: __m128i j, one = _mm_insert_epi8(zero, 1, 15);
aez_ni.c: ^
aez_ni.c: /usr/lib/llvm-16/lib/clang/16/include/smmintrin.h:923:13: note: expanded from macro '_mm_insert_epi8'
aez_ni.c: ((__m128i)__builtin_ia32_vec_set_v16qi((__v16qi)(__m128i)(X), (int)(I), \
aez_ni.c: ^
aez_ni.c: 4 errors generated.
Number of similar (implementation,compiler) pairs: 1, namely:
Implementation | Compiler |
T:aesni | clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_16.0.6_(27+b1)) |
Compiler output
aez_ni.c: In file included from aez_ni.c:37:
aez_ni.c: In function '_mm_loadu_si128',
aez_ni.c: inlined from 'zero_pad' at aez_ni.c:67:12,
aez_ni.c: inlined from 'cipher_aez_tiny' at aez_ni.c:498:18,
aez_ni.c: inlined from 'aez_encrypt' at aez_ni.c:588:9,
aez_ni.c: inlined from 'crypto_aead_aezv3_aesni_timingleaks_encrypt' at aez_ni.c:637:5:
aez_ni.c: /usr/lib/gcc/x86_64-linux-gnu/13/include/emmintrin.h:706:10: warning: array subscript '__m128i_u[2]' is partly outside array bounds of 'const unsigned char[48]' [-Warray-bounds=]
aez_ni.c: 706 | return *__P;
aez_ni.c: | ^~~~
aez_ni.c: aez_ni.c: In function 'crypto_aead_aezv3_aesni_timingleaks_encrypt':
aez_ni.c: aez_ni.c:59:28: note: at offset [33, 48] into object 'pad' of size 48
aez_ni.c: 59 | static const unsigned char pad[] = {0xff,0xff,0xff,0xff,0xff,0xff,0xff,0xff,
aez_ni.c: | ^~~
aez_ni.c: In function 'load_partial',
aez_ni.c: inlined from 'load_partial' at aez_ni.c:119:16,
aez_ni.c: inlined from 'cipher_aez_tiny' at aez_ni.c:498:18,
aez_ni.c: inlined from 'aez_encrypt' at aez_ni.c:588:9,
aez_ni.c: inlined from 'crypto_aead_aezv3_aesni_timingleaks_encrypt' at aez_ni.c:637:5:
aez_ni.c: aez_ni.c:123:46: warning: '__builtin_memcpy' forming offset [16, 4294967263] is out of the bounds [0, 16] of object 'tmp' with type '__m128i' [-Warray-bounds=]
aez_ni.c: 123 | for (i=0; i<n; i++) ((char*)&tmp)[i] = ((char*)p)[i];
aez_ni.c: | ~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~
aez_ni.c: aez_ni.c: In function 'crypto_aead_aezv3_aesni_timingleaks_encrypt':
aez_ni.c: aez_ni.c:122:17: note: 'tmp' declared here
aez_ni.c: 122 | __m128i tmp; unsigned i;
aez_ni.c: | ^~~
Number of similar (implementation,compiler) pairs: 1, namely:
Implementation | Compiler |
T:aesni | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0) |