• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

randombit / botan / 23086172114

14 Mar 2026 10:30AM UTC coverage: 90.111% (-0.1%) from 90.207%
23086172114

push

github

web-flow
Merge pull request #5440 from randombit/jack/aria-avx512-gfni

Add ARIA implementation using AVX-512 GFNI

104202 of 115637 relevant lines covered (90.11%)

11559627.62 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

96.69
/src/lib/block/aria/aria.cpp
1
/*
2
* ARIA
3
* Adapted for Botan by Jeffrey Walton, public domain
4
*
5
* Further changes
6
* (C) 2017,2020 Jack Lloyd
7
*
8
* Botan is released under the Simplified BSD License (see license.txt)
9
*
10
* This ARIA implementation is based on the 32-bit implementation by Aaram Yun from the
11
* National Security Research Institute, KOREA. Aaram Yun's implementation is based on
12
* the 8-bit implementation by Jin Hong. The source files are available in ARIA.zip from
13
* the Korea Internet & Security Agency website.
14
* <A HREF="https://tools.ietf.org/html/rfc5794">RFC 5794, A Description of the ARIA Encryption Algorithm</A>,
15
* <A HREF="http://seed.kisa.or.kr/iwt/ko/bbs/EgovReferenceList.do?bbsId=BBSMSTR_000000000002">Korea
16
* Internet & Security Agency homepage</A>
17
*/
18

19
#include <botan/internal/aria.h>
20

21
#include <botan/internal/bswap.h>
22
#include <botan/internal/loadstor.h>
23
#include <botan/internal/prefetch.h>
24
#include <botan/internal/rotate.h>
25

26
#if defined(BOTAN_HAS_CPUID)
27
   #include <botan/internal/cpuid.h>
28
#endif
29

30
namespace Botan {
31

32
namespace {
33

34
namespace ARIA_F {
35

36
alignas(256) const uint8_t S1[256] = {
37
   0x63, 0x7C, 0x77, 0x7B, 0xF2, 0x6B, 0x6F, 0xC5, 0x30, 0x01, 0x67, 0x2B, 0xFE, 0xD7, 0xAB, 0x76, 0xCA, 0x82, 0xC9,
38
   0x7D, 0xFA, 0x59, 0x47, 0xF0, 0xAD, 0xD4, 0xA2, 0xAF, 0x9C, 0xA4, 0x72, 0xC0, 0xB7, 0xFD, 0x93, 0x26, 0x36, 0x3F,
39
   0xF7, 0xCC, 0x34, 0xA5, 0xE5, 0xF1, 0x71, 0xD8, 0x31, 0x15, 0x04, 0xC7, 0x23, 0xC3, 0x18, 0x96, 0x05, 0x9A, 0x07,
40
   0x12, 0x80, 0xE2, 0xEB, 0x27, 0xB2, 0x75, 0x09, 0x83, 0x2C, 0x1A, 0x1B, 0x6E, 0x5A, 0xA0, 0x52, 0x3B, 0xD6, 0xB3,
41
   0x29, 0xE3, 0x2F, 0x84, 0x53, 0xD1, 0x00, 0xED, 0x20, 0xFC, 0xB1, 0x5B, 0x6A, 0xCB, 0xBE, 0x39, 0x4A, 0x4C, 0x58,
42
   0xCF, 0xD0, 0xEF, 0xAA, 0xFB, 0x43, 0x4D, 0x33, 0x85, 0x45, 0xF9, 0x02, 0x7F, 0x50, 0x3C, 0x9F, 0xA8, 0x51, 0xA3,
43
   0x40, 0x8F, 0x92, 0x9D, 0x38, 0xF5, 0xBC, 0xB6, 0xDA, 0x21, 0x10, 0xFF, 0xF3, 0xD2, 0xCD, 0x0C, 0x13, 0xEC, 0x5F,
44
   0x97, 0x44, 0x17, 0xC4, 0xA7, 0x7E, 0x3D, 0x64, 0x5D, 0x19, 0x73, 0x60, 0x81, 0x4F, 0xDC, 0x22, 0x2A, 0x90, 0x88,
45
   0x46, 0xEE, 0xB8, 0x14, 0xDE, 0x5E, 0x0B, 0xDB, 0xE0, 0x32, 0x3A, 0x0A, 0x49, 0x06, 0x24, 0x5C, 0xC2, 0xD3, 0xAC,
46
   0x62, 0x91, 0x95, 0xE4, 0x79, 0xE7, 0xC8, 0x37, 0x6D, 0x8D, 0xD5, 0x4E, 0xA9, 0x6C, 0x56, 0xF4, 0xEA, 0x65, 0x7A,
47
   0xAE, 0x08, 0xBA, 0x78, 0x25, 0x2E, 0x1C, 0xA6, 0xB4, 0xC6, 0xE8, 0xDD, 0x74, 0x1F, 0x4B, 0xBD, 0x8B, 0x8A, 0x70,
48
   0x3E, 0xB5, 0x66, 0x48, 0x03, 0xF6, 0x0E, 0x61, 0x35, 0x57, 0xB9, 0x86, 0xC1, 0x1D, 0x9E, 0xE1, 0xF8, 0x98, 0x11,
49
   0x69, 0xD9, 0x8E, 0x94, 0x9B, 0x1E, 0x87, 0xE9, 0xCE, 0x55, 0x28, 0xDF, 0x8C, 0xA1, 0x89, 0x0D, 0xBF, 0xE6, 0x42,
50
   0x68, 0x41, 0x99, 0x2D, 0x0F, 0xB0, 0x54, 0xBB, 0x16};
51

52
alignas(256) const uint8_t S2[256] = {
53
   0xE2, 0x4E, 0x54, 0xFC, 0x94, 0xC2, 0x4A, 0xCC, 0x62, 0x0D, 0x6A, 0x46, 0x3C, 0x4D, 0x8B, 0xD1, 0x5E, 0xFA, 0x64,
54
   0xCB, 0xB4, 0x97, 0xBE, 0x2B, 0xBC, 0x77, 0x2E, 0x03, 0xD3, 0x19, 0x59, 0xC1, 0x1D, 0x06, 0x41, 0x6B, 0x55, 0xF0,
55
   0x99, 0x69, 0xEA, 0x9C, 0x18, 0xAE, 0x63, 0xDF, 0xE7, 0xBB, 0x00, 0x73, 0x66, 0xFB, 0x96, 0x4C, 0x85, 0xE4, 0x3A,
56
   0x09, 0x45, 0xAA, 0x0F, 0xEE, 0x10, 0xEB, 0x2D, 0x7F, 0xF4, 0x29, 0xAC, 0xCF, 0xAD, 0x91, 0x8D, 0x78, 0xC8, 0x95,
57
   0xF9, 0x2F, 0xCE, 0xCD, 0x08, 0x7A, 0x88, 0x38, 0x5C, 0x83, 0x2A, 0x28, 0x47, 0xDB, 0xB8, 0xC7, 0x93, 0xA4, 0x12,
58
   0x53, 0xFF, 0x87, 0x0E, 0x31, 0x36, 0x21, 0x58, 0x48, 0x01, 0x8E, 0x37, 0x74, 0x32, 0xCA, 0xE9, 0xB1, 0xB7, 0xAB,
59
   0x0C, 0xD7, 0xC4, 0x56, 0x42, 0x26, 0x07, 0x98, 0x60, 0xD9, 0xB6, 0xB9, 0x11, 0x40, 0xEC, 0x20, 0x8C, 0xBD, 0xA0,
60
   0xC9, 0x84, 0x04, 0x49, 0x23, 0xF1, 0x4F, 0x50, 0x1F, 0x13, 0xDC, 0xD8, 0xC0, 0x9E, 0x57, 0xE3, 0xC3, 0x7B, 0x65,
61
   0x3B, 0x02, 0x8F, 0x3E, 0xE8, 0x25, 0x92, 0xE5, 0x15, 0xDD, 0xFD, 0x17, 0xA9, 0xBF, 0xD4, 0x9A, 0x7E, 0xC5, 0x39,
62
   0x67, 0xFE, 0x76, 0x9D, 0x43, 0xA7, 0xE1, 0xD0, 0xF5, 0x68, 0xF2, 0x1B, 0x34, 0x70, 0x05, 0xA3, 0x8A, 0xD5, 0x79,
63
   0x86, 0xA8, 0x30, 0xC6, 0x51, 0x4B, 0x1E, 0xA6, 0x27, 0xF6, 0x35, 0xD2, 0x6E, 0x24, 0x16, 0x82, 0x5F, 0xDA, 0xE6,
64
   0x75, 0xA2, 0xEF, 0x2C, 0xB2, 0x1C, 0x9F, 0x5D, 0x6F, 0x80, 0x0A, 0x72, 0x44, 0x9B, 0x6C, 0x90, 0x0B, 0x5B, 0x33,
65
   0x7D, 0x5A, 0x52, 0xF3, 0x61, 0xA1, 0xF7, 0xB0, 0xD6, 0x3F, 0x7C, 0x6D, 0xED, 0x14, 0xE0, 0xA5, 0x3D, 0x22, 0xB3,
66
   0xF8, 0x89, 0xDE, 0x71, 0x1A, 0xAF, 0xBA, 0xB5, 0x81};
67

68
alignas(256) const uint8_t X1[256] = {
69
   0x52, 0x09, 0x6A, 0xD5, 0x30, 0x36, 0xA5, 0x38, 0xBF, 0x40, 0xA3, 0x9E, 0x81, 0xF3, 0xD7, 0xFB, 0x7C, 0xE3, 0x39,
70
   0x82, 0x9B, 0x2F, 0xFF, 0x87, 0x34, 0x8E, 0x43, 0x44, 0xC4, 0xDE, 0xE9, 0xCB, 0x54, 0x7B, 0x94, 0x32, 0xA6, 0xC2,
71
   0x23, 0x3D, 0xEE, 0x4C, 0x95, 0x0B, 0x42, 0xFA, 0xC3, 0x4E, 0x08, 0x2E, 0xA1, 0x66, 0x28, 0xD9, 0x24, 0xB2, 0x76,
72
   0x5B, 0xA2, 0x49, 0x6D, 0x8B, 0xD1, 0x25, 0x72, 0xF8, 0xF6, 0x64, 0x86, 0x68, 0x98, 0x16, 0xD4, 0xA4, 0x5C, 0xCC,
73
   0x5D, 0x65, 0xB6, 0x92, 0x6C, 0x70, 0x48, 0x50, 0xFD, 0xED, 0xB9, 0xDA, 0x5E, 0x15, 0x46, 0x57, 0xA7, 0x8D, 0x9D,
74
   0x84, 0x90, 0xD8, 0xAB, 0x00, 0x8C, 0xBC, 0xD3, 0x0A, 0xF7, 0xE4, 0x58, 0x05, 0xB8, 0xB3, 0x45, 0x06, 0xD0, 0x2C,
75
   0x1E, 0x8F, 0xCA, 0x3F, 0x0F, 0x02, 0xC1, 0xAF, 0xBD, 0x03, 0x01, 0x13, 0x8A, 0x6B, 0x3A, 0x91, 0x11, 0x41, 0x4F,
76
   0x67, 0xDC, 0xEA, 0x97, 0xF2, 0xCF, 0xCE, 0xF0, 0xB4, 0xE6, 0x73, 0x96, 0xAC, 0x74, 0x22, 0xE7, 0xAD, 0x35, 0x85,
77
   0xE2, 0xF9, 0x37, 0xE8, 0x1C, 0x75, 0xDF, 0x6E, 0x47, 0xF1, 0x1A, 0x71, 0x1D, 0x29, 0xC5, 0x89, 0x6F, 0xB7, 0x62,
78
   0x0E, 0xAA, 0x18, 0xBE, 0x1B, 0xFC, 0x56, 0x3E, 0x4B, 0xC6, 0xD2, 0x79, 0x20, 0x9A, 0xDB, 0xC0, 0xFE, 0x78, 0xCD,
79
   0x5A, 0xF4, 0x1F, 0xDD, 0xA8, 0x33, 0x88, 0x07, 0xC7, 0x31, 0xB1, 0x12, 0x10, 0x59, 0x27, 0x80, 0xEC, 0x5F, 0x60,
80
   0x51, 0x7F, 0xA9, 0x19, 0xB5, 0x4A, 0x0D, 0x2D, 0xE5, 0x7A, 0x9F, 0x93, 0xC9, 0x9C, 0xEF, 0xA0, 0xE0, 0x3B, 0x4D,
81
   0xAE, 0x2A, 0xF5, 0xB0, 0xC8, 0xEB, 0xBB, 0x3C, 0x83, 0x53, 0x99, 0x61, 0x17, 0x2B, 0x04, 0x7E, 0xBA, 0x77, 0xD6,
82
   0x26, 0xE1, 0x69, 0x14, 0x63, 0x55, 0x21, 0x0C, 0x7D};
83

84
alignas(256) const uint8_t X2[256] = {
85
   0x30, 0x68, 0x99, 0x1B, 0x87, 0xB9, 0x21, 0x78, 0x50, 0x39, 0xDB, 0xE1, 0x72, 0x09, 0x62, 0x3C, 0x3E, 0x7E, 0x5E,
86
   0x8E, 0xF1, 0xA0, 0xCC, 0xA3, 0x2A, 0x1D, 0xFB, 0xB6, 0xD6, 0x20, 0xC4, 0x8D, 0x81, 0x65, 0xF5, 0x89, 0xCB, 0x9D,
87
   0x77, 0xC6, 0x57, 0x43, 0x56, 0x17, 0xD4, 0x40, 0x1A, 0x4D, 0xC0, 0x63, 0x6C, 0xE3, 0xB7, 0xC8, 0x64, 0x6A, 0x53,
88
   0xAA, 0x38, 0x98, 0x0C, 0xF4, 0x9B, 0xED, 0x7F, 0x22, 0x76, 0xAF, 0xDD, 0x3A, 0x0B, 0x58, 0x67, 0x88, 0x06, 0xC3,
89
   0x35, 0x0D, 0x01, 0x8B, 0x8C, 0xC2, 0xE6, 0x5F, 0x02, 0x24, 0x75, 0x93, 0x66, 0x1E, 0xE5, 0xE2, 0x54, 0xD8, 0x10,
90
   0xCE, 0x7A, 0xE8, 0x08, 0x2C, 0x12, 0x97, 0x32, 0xAB, 0xB4, 0x27, 0x0A, 0x23, 0xDF, 0xEF, 0xCA, 0xD9, 0xB8, 0xFA,
91
   0xDC, 0x31, 0x6B, 0xD1, 0xAD, 0x19, 0x49, 0xBD, 0x51, 0x96, 0xEE, 0xE4, 0xA8, 0x41, 0xDA, 0xFF, 0xCD, 0x55, 0x86,
92
   0x36, 0xBE, 0x61, 0x52, 0xF8, 0xBB, 0x0E, 0x82, 0x48, 0x69, 0x9A, 0xE0, 0x47, 0x9E, 0x5C, 0x04, 0x4B, 0x34, 0x15,
93
   0x79, 0x26, 0xA7, 0xDE, 0x29, 0xAE, 0x92, 0xD7, 0x84, 0xE9, 0xD2, 0xBA, 0x5D, 0xF3, 0xC5, 0xB0, 0xBF, 0xA4, 0x3B,
94
   0x71, 0x44, 0x46, 0x2B, 0xFC, 0xEB, 0x6F, 0xD5, 0xF6, 0x14, 0xFE, 0x7C, 0x70, 0x5A, 0x7D, 0xFD, 0x2F, 0x18, 0x83,
95
   0x16, 0xA5, 0x91, 0x1F, 0x05, 0x95, 0x74, 0xA9, 0xC1, 0x5B, 0x4A, 0x85, 0x6D, 0x13, 0x07, 0x4F, 0x4E, 0x45, 0xB2,
96
   0x0F, 0xC9, 0x1C, 0xA6, 0xBC, 0xEC, 0x73, 0x90, 0x7B, 0xCF, 0x59, 0x8F, 0xA1, 0xF9, 0x2D, 0xF2, 0xB1, 0x00, 0x94,
97
   0x37, 0x9F, 0xD0, 0x2E, 0x9C, 0x6E, 0x28, 0x3F, 0x80, 0xF0, 0x3D, 0xD3, 0x25, 0x8A, 0xB5, 0xE7, 0x42, 0xB3, 0xC7,
98
   0xEA, 0xF7, 0x4C, 0x11, 0x33, 0x03, 0xA2, 0xAC, 0x60};
99

100
inline uint32_t ARIA_F1(uint32_t X) {
181,132✔
101
   const uint32_t M1 = 0x00010101;
181,132✔
102
   const uint32_t M2 = 0x01000101;
181,132✔
103
   const uint32_t M3 = 0x01010001;
181,132✔
104
   const uint32_t M4 = 0x01010100;
181,132✔
105

106
   return (S1[get_byte<0>(X)] * M1) ^ (S2[get_byte<1>(X)] * M2) ^ (X1[get_byte<2>(X)] * M3) ^ (X2[get_byte<3>(X)] * M4);
181,132✔
107
}
108

109
inline uint32_t ARIA_F2(uint32_t X) {
153,664✔
110
   const uint32_t M1 = 0x00010101;
153,664✔
111
   const uint32_t M2 = 0x01000101;
153,664✔
112
   const uint32_t M3 = 0x01010001;
153,664✔
113
   const uint32_t M4 = 0x01010100;
153,664✔
114

115
   return (X1[get_byte<0>(X)] * M3) ^ (X2[get_byte<1>(X)] * M4) ^ (S1[get_byte<2>(X)] * M1) ^ (S2[get_byte<3>(X)] * M2);
153,664✔
116
}
117

118
inline void ARIA_FO(uint32_t& T0, uint32_t& T1, uint32_t& T2, uint32_t& T3) {
45,283✔
119
   T0 = ARIA_F1(T0);
45,283✔
120
   T1 = ARIA_F1(T1);
45,283✔
121
   T2 = ARIA_F1(T2);
45,283✔
122
   T3 = ARIA_F1(T3);
45,283✔
123

124
   T1 ^= T2;
45,283✔
125
   T2 ^= T3;
45,283✔
126
   T0 ^= T1;
45,283✔
127
   T3 ^= T1;
45,283✔
128
   T2 ^= T0;
45,283✔
129
   T1 ^= T2;
45,283✔
130

131
   T1 = ((T1 << 8) & 0xFF00FF00) | ((T1 >> 8) & 0x00FF00FF);
45,283✔
132
   T2 = rotr<16>(T2);
45,283✔
133
   T3 = reverse_bytes(T3);
45,283✔
134

135
   T1 ^= T2;
45,283✔
136
   T2 ^= T3;
45,283✔
137
   T0 ^= T1;
45,283✔
138
   T3 ^= T1;
45,283✔
139
   T2 ^= T0;
45,283✔
140
   T1 ^= T2;
45,283✔
141
}
45,283✔
142

143
inline void ARIA_FE(uint32_t& T0, uint32_t& T1, uint32_t& T2, uint32_t& T3) {
38,416✔
144
   T0 = ARIA_F2(T0);
38,416✔
145
   T1 = ARIA_F2(T1);
38,416✔
146
   T2 = ARIA_F2(T2);
38,416✔
147
   T3 = ARIA_F2(T3);
38,416✔
148

149
   T1 ^= T2;
38,416✔
150
   T2 ^= T3;
38,416✔
151
   T0 ^= T1;
38,416✔
152
   T3 ^= T1;
38,416✔
153
   T2 ^= T0;
38,416✔
154
   T1 ^= T2;
38,416✔
155

156
   T3 = ((T3 << 8) & 0xFF00FF00) | ((T3 >> 8) & 0x00FF00FF);
38,416✔
157
   T0 = rotr<16>(T0);
38,416✔
158
   T1 = reverse_bytes(T1);
38,416✔
159

160
   T1 ^= T2;
38,416✔
161
   T2 ^= T3;
38,416✔
162
   T0 ^= T1;
38,416✔
163
   T3 ^= T1;
38,416✔
164
   T2 ^= T0;
38,416✔
165
   T1 ^= T2;
38,416✔
166
}
38,416✔
167

168
/*
169
* ARIA encryption and decryption
170
*/
171
void transform(const uint8_t in[], uint8_t out[], size_t blocks, const secure_vector<uint32_t>& KS) {
2,082✔
172
   prefetch_arrays(S1, S2, X1, X2);
2,082✔
173

174
   const size_t ROUNDS = (KS.size() / 4) - 1;
2,082✔
175

176
   for(size_t i = 0; i != blocks; ++i) {
8,872✔
177
      uint32_t t0 = 0;
6,790✔
178
      uint32_t t1 = 0;
6,790✔
179
      uint32_t t2 = 0;
6,790✔
180
      uint32_t t3 = 0;
6,790✔
181
      load_be(in + 16 * i, t0, t1, t2, t3);
6,790✔
182

183
      for(size_t r = 0; r < ROUNDS; r += 2) {
51,919✔
184
         t0 ^= KS[4 * r];
45,129✔
185
         t1 ^= KS[4 * r + 1];
45,129✔
186
         t2 ^= KS[4 * r + 2];
45,129✔
187
         t3 ^= KS[4 * r + 3];
45,129✔
188
         ARIA_FO(t0, t1, t2, t3);
45,129✔
189

190
         t0 ^= KS[4 * r + 4];
45,129✔
191
         t1 ^= KS[4 * r + 5];
45,129✔
192
         t2 ^= KS[4 * r + 6];
45,129✔
193
         t3 ^= KS[4 * r + 7];
45,129✔
194

195
         if(r != ROUNDS - 2) {
45,129✔
196
            ARIA_FE(t0, t1, t2, t3);
38,339✔
197
         }
198
      }
199

200
      out[16 * i + 0] = X1[get_byte<0>(t0)] ^ get_byte<0>(KS[4 * ROUNDS]);
6,790✔
201
      out[16 * i + 1] = X2[get_byte<1>(t0)] ^ get_byte<1>(KS[4 * ROUNDS]);
6,790✔
202
      out[16 * i + 2] = S1[get_byte<2>(t0)] ^ get_byte<2>(KS[4 * ROUNDS]);
6,790✔
203
      out[16 * i + 3] = S2[get_byte<3>(t0)] ^ get_byte<3>(KS[4 * ROUNDS]);
6,790✔
204
      out[16 * i + 4] = X1[get_byte<0>(t1)] ^ get_byte<0>(KS[4 * ROUNDS + 1]);
6,790✔
205
      out[16 * i + 5] = X2[get_byte<1>(t1)] ^ get_byte<1>(KS[4 * ROUNDS + 1]);
6,790✔
206
      out[16 * i + 6] = S1[get_byte<2>(t1)] ^ get_byte<2>(KS[4 * ROUNDS + 1]);
6,790✔
207
      out[16 * i + 7] = S2[get_byte<3>(t1)] ^ get_byte<3>(KS[4 * ROUNDS + 1]);
6,790✔
208
      out[16 * i + 8] = X1[get_byte<0>(t2)] ^ get_byte<0>(KS[4 * ROUNDS + 2]);
6,790✔
209
      out[16 * i + 9] = X2[get_byte<1>(t2)] ^ get_byte<1>(KS[4 * ROUNDS + 2]);
6,790✔
210
      out[16 * i + 10] = S1[get_byte<2>(t2)] ^ get_byte<2>(KS[4 * ROUNDS + 2]);
6,790✔
211
      out[16 * i + 11] = S2[get_byte<3>(t2)] ^ get_byte<3>(KS[4 * ROUNDS + 2]);
6,790✔
212
      out[16 * i + 12] = X1[get_byte<0>(t3)] ^ get_byte<0>(KS[4 * ROUNDS + 3]);
6,790✔
213
      out[16 * i + 13] = X2[get_byte<1>(t3)] ^ get_byte<1>(KS[4 * ROUNDS + 3]);
6,790✔
214
      out[16 * i + 14] = S1[get_byte<2>(t3)] ^ get_byte<2>(KS[4 * ROUNDS + 3]);
6,790✔
215
      out[16 * i + 15] = S2[get_byte<3>(t3)] ^ get_byte<3>(KS[4 * ROUNDS + 3]);
6,790✔
216
   }
217
}
2,082✔
218

219
// n-bit right shift of Y XORed to X
220
template <size_t N>
221
inline void ARIA_ROL128(const uint32_t X[4], const uint32_t Y[4], uint32_t KS[4]) {
1,123✔
222
   // MSVC is not generating a "rotate immediate". Constify to help it along.
223
   static const size_t Q = 4 - (N / 32);
224
   static const size_t R = N % 32;
225
   static_assert(R > 0 && R < 32, "Rotation in range for type");
226
   KS[0] = (X[0]) ^ ((Y[(Q) % 4]) >> R) ^ ((Y[(Q + 3) % 4]) << (32 - R));
1,123✔
227
   KS[1] = (X[1]) ^ ((Y[(Q + 1) % 4]) >> R) ^ ((Y[(Q) % 4]) << (32 - R));
1,123✔
228
   KS[2] = (X[2]) ^ ((Y[(Q + 2) % 4]) >> R) ^ ((Y[(Q + 1) % 4]) << (32 - R));
1,123✔
229
   KS[3] = (X[3]) ^ ((Y[(Q + 3) % 4]) >> R) ^ ((Y[(Q + 2) % 4]) << (32 - R));
1,123✔
230
}
1,123✔
231

232
void aria_ks_dk_transform(uint32_t& K0, uint32_t& K1, uint32_t& K2, uint32_t& K3) {
969✔
233
   K0 = rotr<8>(K0) ^ rotr<16>(K0) ^ rotr<24>(K0);
969✔
234
   K1 = rotr<8>(K1) ^ rotr<16>(K1) ^ rotr<24>(K1);
969✔
235
   K2 = rotr<8>(K2) ^ rotr<16>(K2) ^ rotr<24>(K2);
969✔
236
   K3 = rotr<8>(K3) ^ rotr<16>(K3) ^ rotr<24>(K3);
969✔
237

238
   K1 ^= K2;
969✔
239
   K2 ^= K3;
969✔
240
   K0 ^= K1;
969✔
241
   K3 ^= K1;
969✔
242
   K2 ^= K0;
969✔
243
   K1 ^= K2;
969✔
244

245
   K1 = ((K1 << 8) & 0xFF00FF00) | ((K1 >> 8) & 0x00FF00FF);
969✔
246
   K2 = rotr<16>(K2);
969✔
247
   K3 = reverse_bytes(K3);
969✔
248

249
   K1 ^= K2;
969✔
250
   K2 ^= K3;
969✔
251
   K0 ^= K1;
969✔
252
   K3 ^= K1;
969✔
253
   K2 ^= K0;
969✔
254
   K1 ^= K2;
969✔
255
}
969✔
256

257
/*
258
* ARIA Key Schedule
259
*/
260
void key_schedule(secure_vector<uint32_t>& ERK, secure_vector<uint32_t>& DRK, std::span<const uint8_t> key) {
77✔
261
   const uint32_t KRK[3][4] = {{0x517cc1b7, 0x27220a94, 0xfe13abe8, 0xfa9a6ee0},
77✔
262
                               {0x6db14acc, 0x9e21c820, 0xff28b1d5, 0xef5de2b0},
263
                               {0xdb92371d, 0x2126e970, 0x03249775, 0x04e8c90e}};
264

265
   const size_t CK0 = (key.size() / 8) - 2;
77✔
266
   const size_t CK1 = (CK0 + 1) % 3;
77✔
267
   const size_t CK2 = (CK1 + 1) % 3;
77✔
268

269
   uint32_t w0[4];
77✔
270
   uint32_t w1[4];
77✔
271
   uint32_t w2[4];
77✔
272
   uint32_t w3[4];
77✔
273

274
   w0[0] = load_be<uint32_t>(key.data(), 0);
77✔
275
   w0[1] = load_be<uint32_t>(key.data(), 1);
77✔
276
   w0[2] = load_be<uint32_t>(key.data(), 2);
77✔
277
   w0[3] = load_be<uint32_t>(key.data(), 3);
77✔
278

279
   w1[0] = w0[0] ^ KRK[CK0][0];
77✔
280
   w1[1] = w0[1] ^ KRK[CK0][1];
77✔
281
   w1[2] = w0[2] ^ KRK[CK0][2];
77✔
282
   w1[3] = w0[3] ^ KRK[CK0][3];
77✔
283

284
   ARIA_FO(w1[0], w1[1], w1[2], w1[3]);
77✔
285

286
   if(key.size() == 24 || key.size() == 32) {
77✔
287
      w1[0] ^= load_be<uint32_t>(key.data(), 4);
35✔
288
      w1[1] ^= load_be<uint32_t>(key.data(), 5);
35✔
289
   }
290
   if(key.size() == 32) {
77✔
291
      w1[2] ^= load_be<uint32_t>(key.data(), 6);
26✔
292
      w1[3] ^= load_be<uint32_t>(key.data(), 7);
26✔
293
   }
294

295
   w2[0] = w1[0] ^ KRK[CK1][0];
77✔
296
   w2[1] = w1[1] ^ KRK[CK1][1];
77✔
297
   w2[2] = w1[2] ^ KRK[CK1][2];
77✔
298
   w2[3] = w1[3] ^ KRK[CK1][3];
77✔
299

300
   ARIA_FE(w2[0], w2[1], w2[2], w2[3]);
77✔
301

302
   w2[0] ^= w0[0];
77✔
303
   w2[1] ^= w0[1];
77✔
304
   w2[2] ^= w0[2];
77✔
305
   w2[3] ^= w0[3];
77✔
306

307
   w3[0] = w2[0] ^ KRK[CK2][0];
77✔
308
   w3[1] = w2[1] ^ KRK[CK2][1];
77✔
309
   w3[2] = w2[2] ^ KRK[CK2][2];
77✔
310
   w3[3] = w2[3] ^ KRK[CK2][3];
77✔
311

312
   ARIA_FO(w3[0], w3[1], w3[2], w3[3]);
77✔
313

314
   w3[0] ^= w1[0];
77✔
315
   w3[1] ^= w1[1];
77✔
316
   w3[2] ^= w1[2];
77✔
317
   w3[3] ^= w1[3];
77✔
318

319
   if(key.size() == 16) {
77✔
320
      ERK.resize(4 * 13);
42✔
321
   } else if(key.size() == 24) {
35✔
322
      ERK.resize(4 * 15);
9✔
323
   } else if(key.size() == 32) {
26✔
324
      ERK.resize(4 * 17);
26✔
325
   }
326

327
   ARIA_ROL128<19>(w0, w1, &ERK[0]);  // NOLINT(*-container-data-pointer)
77✔
328
   ARIA_ROL128<19>(w1, w2, &ERK[4]);
77✔
329
   ARIA_ROL128<19>(w2, w3, &ERK[8]);
77✔
330
   ARIA_ROL128<19>(w3, w0, &ERK[12]);
77✔
331
   ARIA_ROL128<31>(w0, w1, &ERK[16]);
77✔
332
   ARIA_ROL128<31>(w1, w2, &ERK[20]);
77✔
333
   ARIA_ROL128<31>(w2, w3, &ERK[24]);
77✔
334
   ARIA_ROL128<31>(w3, w0, &ERK[28]);
77✔
335
   ARIA_ROL128<67>(w0, w1, &ERK[32]);
77✔
336
   ARIA_ROL128<67>(w1, w2, &ERK[36]);
77✔
337
   ARIA_ROL128<67>(w2, w3, &ERK[40]);
77✔
338
   ARIA_ROL128<67>(w3, w0, &ERK[44]);
77✔
339
   ARIA_ROL128<97>(w0, w1, &ERK[48]);
77✔
340

341
   if(key.size() == 24 || key.size() == 32) {
77✔
342
      ARIA_ROL128<97>(w1, w2, &ERK[52]);
35✔
343
      ARIA_ROL128<97>(w2, w3, &ERK[56]);
35✔
344

345
      if(key.size() == 32) {
35✔
346
         ARIA_ROL128<97>(w3, w0, &ERK[60]);
26✔
347
         ARIA_ROL128<109>(w0, w1, &ERK[64]);
26✔
348
      }
349
   }
350

351
   // Now create the decryption key schedule
352
   DRK.resize(ERK.size());
77✔
353

354
   for(size_t i = 0; i != DRK.size(); i += 4) {
1,200✔
355
      DRK[i] = ERK[ERK.size() - 4 - i];
1,123✔
356
      DRK[i + 1] = ERK[ERK.size() - 3 - i];
1,123✔
357
      DRK[i + 2] = ERK[ERK.size() - 2 - i];
1,123✔
358
      DRK[i + 3] = ERK[ERK.size() - 1 - i];
1,123✔
359
   }
360

361
   for(size_t i = 4; i != DRK.size() - 4; i += 4) {
1,046✔
362
      aria_ks_dk_transform(DRK[i + 0], DRK[i + 1], DRK[i + 2], DRK[i + 3]);
969✔
363
   }
364
}
77✔
365

366
}  // namespace ARIA_F
367

368
}  // namespace
369

370
void ARIA_128::encrypt_n(const uint8_t in[], uint8_t out[], size_t blocks) const {
1,061✔
371
   assert_key_material_set();
1,061✔
372

373
#if defined(BOTAN_HAS_ARIA_AVX512_GFNI)
374
   if(CPUID::has(CPUID::Feature::AVX512, CPUID::Feature::GFNI)) {
1,052✔
375
      return aria_avx512_gfni_encrypt(in, out, blocks);
×
376
   }
377
#endif
378

379
   ARIA_F::transform(in, out, blocks, m_ERK);
1,052✔
380
}
381

382
void ARIA_192::encrypt_n(const uint8_t in[], uint8_t out[], size_t blocks) const {
15✔
383
   assert_key_material_set();
15✔
384

385
#if defined(BOTAN_HAS_ARIA_AVX512_GFNI)
386
   if(CPUID::has(CPUID::Feature::AVX512, CPUID::Feature::GFNI)) {
9✔
387
      return aria_avx512_gfni_encrypt(in, out, blocks);
×
388
   }
389
#endif
390

391
   ARIA_F::transform(in, out, blocks, m_ERK);
9✔
392
}
393

394
void ARIA_256::encrypt_n(const uint8_t in[], uint8_t out[], size_t blocks) const {
472✔
395
   assert_key_material_set();
472✔
396

397
#if defined(BOTAN_HAS_ARIA_AVX512_GFNI)
398
   if(CPUID::has(CPUID::Feature::AVX512, CPUID::Feature::GFNI)) {
466✔
399
      return aria_avx512_gfni_encrypt(in, out, blocks);
×
400
   }
401
#endif
402

403
   ARIA_F::transform(in, out, blocks, m_ERK);
466✔
404
}
405

406
void ARIA_128::decrypt_n(const uint8_t in[], uint8_t out[], size_t blocks) const {
268✔
407
   assert_key_material_set();
268✔
408

409
#if defined(BOTAN_HAS_ARIA_AVX512_GFNI)
410
   if(CPUID::has(CPUID::Feature::AVX512, CPUID::Feature::GFNI)) {
262✔
411
      return aria_avx512_gfni_decrypt(in, out, blocks);
×
412
   }
413
#endif
414

415
   ARIA_F::transform(in, out, blocks, m_DRK);
262✔
416
}
417

418
void ARIA_192::decrypt_n(const uint8_t in[], uint8_t out[], size_t blocks) const {
12✔
419
   assert_key_material_set();
12✔
420

421
#if defined(BOTAN_HAS_ARIA_AVX512_GFNI)
422
   if(CPUID::has(CPUID::Feature::AVX512, CPUID::Feature::GFNI)) {
6✔
423
      return aria_avx512_gfni_decrypt(in, out, blocks);
×
424
   }
425
#endif
426

427
   ARIA_F::transform(in, out, blocks, m_DRK);
6✔
428
}
429

430
void ARIA_256::decrypt_n(const uint8_t in[], uint8_t out[], size_t blocks) const {
293✔
431
   assert_key_material_set();
293✔
432

433
#if defined(BOTAN_HAS_ARIA_AVX512_GFNI)
434
   if(CPUID::has(CPUID::Feature::AVX512, CPUID::Feature::GFNI)) {
287✔
435
      return aria_avx512_gfni_decrypt(in, out, blocks);
×
436
   }
437
#endif
438

439
   ARIA_F::transform(in, out, blocks, m_DRK);
287✔
440
}
441

442
bool ARIA_128::has_keying_material() const {
3,134✔
443
   return !m_ERK.empty();
3,134✔
444
}
445

446
bool ARIA_192::has_keying_material() const {
39✔
447
   return !m_ERK.empty();
39✔
448
}
449

450
bool ARIA_256::has_keying_material() const {
2,291✔
451
   return !m_ERK.empty();
2,291✔
452
}
453

454
namespace {
455

456
size_t aria_parallelism() {
141✔
457
#if defined(BOTAN_HAS_ARIA_AVX512_GFNI)
458
   if(CPUID::has(CPUID::Feature::AVX512, CPUID::Feature::GFNI)) {
141✔
459
      return 16;
×
460
   }
461
#endif
462
   return 1;
463
}
464

465
std::string aria_provider() {
9✔
466
#if defined(BOTAN_HAS_ARIA_AVX512_GFNI)
467
   if(auto feat = CPUID::check(CPUID::Feature::AVX512, CPUID::Feature::GFNI)) {
9✔
468
      return *feat;
×
469
   }
×
470
#endif
471
   return "base";
9✔
472
}
473

474
}  // namespace
475

476
size_t ARIA_128::parallelism() const {
78✔
477
   return aria_parallelism();
78✔
478
}
479

480
std::string ARIA_128::provider() const {
3✔
481
   return aria_provider();
3✔
482
}
483

484
size_t ARIA_192::parallelism() const {
9✔
485
   return aria_parallelism();
9✔
486
}
487

488
std::string ARIA_192::provider() const {
3✔
489
   return aria_provider();
3✔
490
}
491

492
size_t ARIA_256::parallelism() const {
54✔
493
   return aria_parallelism();
54✔
494
}
495

496
std::string ARIA_256::provider() const {
3✔
497
   return aria_provider();
3✔
498
}
499

500
void ARIA_128::key_schedule(std::span<const uint8_t> key) {
42✔
501
   ARIA_F::key_schedule(m_ERK, m_DRK, key);
42✔
502
}
42✔
503

504
void ARIA_192::key_schedule(std::span<const uint8_t> key) {
9✔
505
   ARIA_F::key_schedule(m_ERK, m_DRK, key);
9✔
506
}
9✔
507

508
void ARIA_256::key_schedule(std::span<const uint8_t> key) {
26✔
509
   ARIA_F::key_schedule(m_ERK, m_DRK, key);
26✔
510
}
26✔
511

512
void ARIA_128::clear() {
22✔
513
   zap(m_ERK);
22✔
514
   zap(m_DRK);
22✔
515
}
22✔
516

517
void ARIA_192::clear() {
6✔
518
   zap(m_ERK);
6✔
519
   zap(m_DRK);
6✔
520
}
6✔
521

522
void ARIA_256::clear() {
16✔
523
   zap(m_ERK);
16✔
524
   zap(m_DRK);
16✔
525
}
16✔
526

527
}  // namespace Botan
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc