Botan 3.10.0
Crypto and TLS for C&
base64.cpp
Go to the documentation of this file.
1/*
2* Base64 Encoding and Decoding
3* (C) 2010,2015,2020 Jack Lloyd
4*
5* Botan is released under the Simplified BSD License (see license.txt)
6*/
7
8#include <botan/base64.h>
9
10#include <botan/exceptn.h>
11#include <botan/internal/charset.h>
12#include <botan/internal/codec_base.h>
13#include <botan/internal/fmt.h>
14#include <botan/internal/int_utils.h>
15#include <botan/internal/loadstor.h>
16#include <botan/internal/rounding.h>
17
18namespace Botan {
19
20namespace {
21
22class Base64 final {
23 public:
24 static std::string name() noexcept { return "base64"; }
25
26 static constexpr size_t encoding_bytes_in() noexcept { return m_encoding_bytes_in; }
27
28 static constexpr size_t encoding_bytes_out() noexcept { return m_encoding_bytes_out; }
29
30 static constexpr size_t decoding_bytes_in() noexcept { return m_encoding_bytes_out; }
31
32 static constexpr size_t decoding_bytes_out() noexcept { return m_encoding_bytes_in; }
33
34 static constexpr size_t bits_consumed() noexcept { return m_encoding_bits; }
35
36 static constexpr size_t remaining_bits_before_padding() noexcept { return m_remaining_bits_before_padding; }
37
38 static constexpr size_t encode_max_output(size_t input_length) {
39 return (round_up(input_length, m_encoding_bytes_in) / m_encoding_bytes_in) * m_encoding_bytes_out;
40 }
41
42 static constexpr size_t decode_max_output(size_t input_length) {
43 return (round_up(input_length, m_encoding_bytes_out) * m_encoding_bytes_in) / m_encoding_bytes_out;
44 }
45
46 static void encode(char out[4], const uint8_t in[3]) noexcept;
47
48 static uint8_t lookup_binary_value(char input) noexcept;
49
50 static bool check_bad_char(uint8_t bin, char input, bool ignore_ws);
51
52 static void decode(uint8_t* out_ptr, const uint8_t decode_buf[4]) {
53 out_ptr[0] = (decode_buf[0] << 2) | (decode_buf[1] >> 4);
54 out_ptr[1] = (decode_buf[1] << 4) | (decode_buf[2] >> 2);
55 out_ptr[2] = (decode_buf[2] << 6) | decode_buf[3];
56 }
57
58 static size_t bytes_to_remove(size_t final_truncate) { return final_truncate; }
59
60 private:
61 static constexpr size_t m_encoding_bits = 6;
62 static constexpr size_t m_remaining_bits_before_padding = 8;
63
64 static constexpr size_t m_encoding_bytes_in = 3;
65 static constexpr size_t m_encoding_bytes_out = 4;
66};
67
68uint32_t lookup_base64_chars(uint32_t x32) {
69 /*
70 * The basic insight of this approach is that our goal is computing
71 * f(x) = y where x is in [0,63) and y is the correct base64 encoding.
72 *
73 * Instead of doing this directly, we compute
74 * offset(x) such that f(x) = x + offset(x)
75 *
76 * This is described in
77 * http://0x80.pl/notesen/2016-01-12-sse-base64-encoding.html#improved-version
78 *
79 * Here we do a SWAR (simd within a register) implementation of Wojciech's lookup_version2_swar
80 */
81
82 uint32_t r = x32 + 0x41414141;
83
84 r += (~swar_lt<uint32_t>(x32, 0x1A1A1A1A)) & 0x06060606;
85 r -= (~swar_lt<uint32_t>(x32, 0x34343434)) & 0x4B4B4B4B;
86 r -= (~swar_lt<uint32_t>(x32, 0x3E3E3E3E)) & 0x0F0F0F0F;
87 r += (~swar_lt<uint32_t>(x32, 0x3F3F3F3F)) & 0x03030303;
88
89 return r;
90}
91
92//static
93void Base64::encode(char out[4], const uint8_t in[3]) noexcept {
94 const uint32_t b0 = (in[0] & 0xFC) >> 2;
95 const uint32_t b1 = ((in[0] & 0x03) << 4) | (in[1] >> 4);
96 const uint32_t b2 = ((in[1] & 0x0F) << 2) | (in[2] >> 6);
97 const uint32_t b3 = in[2] & 0x3F;
98
99 const uint32_t z = (b0 << 24) | (b1 << 16) | (b2 << 8) | b3;
100
101 const uint32_t b64 = lookup_base64_chars(z);
102
103 out[0] = static_cast<char>(get_byte<0>(b64));
104 out[1] = static_cast<char>(get_byte<1>(b64));
105 out[2] = static_cast<char>(get_byte<2>(b64));
106 out[3] = static_cast<char>(get_byte<3>(b64));
107}
108
109//static
110uint8_t Base64::lookup_binary_value(char input) noexcept {
111 auto has_zero_byte = [](uint64_t v) { return ((v - 0x0101010101010101) & ~(v) & 0x8080808080808080); };
112
113 // Assumes each byte is either 0x00 or 0x80
114 auto index_of_first_set_byte = [](uint64_t v) {
115 return ((((v - 1) & 0x0101010101010101) * 0x0101010101010101) >> 56) - 1;
116 };
117
118 constexpr uint64_t lo = 0x0101010101010101;
119
120 const uint8_t x = static_cast<uint8_t>(input);
121
122 const uint64_t x8 = x * lo;
123
124 // Defines the valid ASCII ranges of base64, except the special chars (below)
125 constexpr uint64_t val_l = make_uint64(0, 0, 0, 0, 0, 'A', 'a', '0');
126 constexpr uint64_t val_u = make_uint64(0, 0, 0, 0, 0, 26, 26, 10);
127
128 // If x is in one of the ranges return a mask. Otherwise we xor in at the
129 // high word which will be our invalid marker
130 auto v_mask = swar_in_range<uint64_t>(x8, val_l, val_u) ^ 0x80000000;
131
132 // This is the offset added to x to get the value
133 const uint64_t val_v = 0xbfb904 ^ (0xFF000000 - (x << 24));
134
135 uint8_t z = x + static_cast<uint8_t>(val_v >> (8 * index_of_first_set_byte(v_mask)));
136
137 // Valid base64 special characters, and some whitespace chars
138 constexpr uint64_t specials_i = make_uint64(0, '+', '/', '=', ' ', '\n', '\t', '\r');
139
140 const uint64_t specials_v = 0x3e3f8180808080 ^ (static_cast<uint64_t>(z) << 56);
141
142 const uint64_t smask = has_zero_byte(x8 ^ specials_i) ^ 0x8000000000000000;
143
144 return static_cast<uint8_t>(specials_v >> (8 * index_of_first_set_byte(smask)));
145}
146
147//static
148bool Base64::check_bad_char(uint8_t bin, char input, bool ignore_ws) {
149 if(bin <= 0x3F) {
150 return true;
151 } else if(!(bin == 0x81 || (bin == 0x80 && ignore_ws))) {
152 throw Invalid_Argument(fmt("base64_decode: invalid character '{}'", format_char_for_display(input)));
153 }
154 return false;
155}
156
157} // namespace
158
159size_t base64_encode(char out[], const uint8_t in[], size_t input_length, size_t& input_consumed, bool final_inputs) {
160 return base_encode(Base64(), out, in, input_length, input_consumed, final_inputs);
161}
162
163std::string base64_encode(const uint8_t input[], size_t input_length) {
164 return base_encode_to_string(Base64(), input, input_length);
165}
166
168 uint8_t out[], const char in[], size_t input_length, size_t& input_consumed, bool final_inputs, bool ignore_ws) {
169 return base_decode(Base64(), out, in, input_length, input_consumed, final_inputs, ignore_ws);
170}
171
172size_t base64_decode(uint8_t output[], const char input[], size_t input_length, bool ignore_ws) {
173 return base_decode_full(Base64(), output, input, input_length, ignore_ws);
174}
175
176size_t base64_decode(uint8_t output[], std::string_view input, bool ignore_ws) {
177 return base64_decode(output, input.data(), input.length(), ignore_ws);
178}
179
180size_t base64_decode(std::span<uint8_t> output, std::string_view input, bool ignore_ws) {
181 if(output.size() < base64_decode_max_output(input.size())) {
182 throw Invalid_Argument("base64_decode: output buffer is too short");
183 }
184 return base64_decode(output.data(), input.data(), input.length(), ignore_ws);
185}
186
187secure_vector<uint8_t> base64_decode(const char input[], size_t input_length, bool ignore_ws) {
188 return base_decode_to_vec<secure_vector<uint8_t>>(Base64(), input, input_length, ignore_ws);
189}
190
191secure_vector<uint8_t> base64_decode(std::string_view input, bool ignore_ws) {
192 return base64_decode(input.data(), input.size(), ignore_ws);
193}
194
195size_t base64_encode_max_output(size_t input_length) {
196 return Base64::encode_max_output(input_length);
197}
198
199size_t base64_decode_max_output(size_t input_length) {
200 return Base64::decode_max_output(input_length);
201}
202
203} // namespace Botan
std::string encode(const uint8_t der[], size_t length, std::string_view label, size_t width)
Definition pem.cpp:39
secure_vector< uint8_t > decode(DataSource &source, std::string &label)
Definition pem.cpp:62
constexpr uint8_t get_byte(T input)
Definition loadstor.h:79
std::string format_char_for_display(char c)
Definition charset.cpp:98
constexpr T swar_lt(T a, T b)
Definition int_utils.h:91
std::string base_encode_to_string(const Base &base, const uint8_t input[], size_t input_length)
Definition codec_base.h:84
constexpr auto out_ptr(T &outptr) noexcept
Definition stl_util.h:414
constexpr uint64_t make_uint64(uint8_t i0, uint8_t i1, uint8_t i2, uint8_t i3, uint8_t i4, uint8_t i5, uint8_t i6, uint8_t i7)
Definition loadstor.h:121
std::string fmt(std::string_view format, const T &... args)
Definition fmt.h:53
constexpr T swar_in_range(T v, T lower, T upper)
Definition int_utils.h:114
constexpr size_t round_up(size_t n, size_t align_to)
Definition rounding.h:26
constexpr size_t index_of_first_set_byte(T v)
Definition int_utils.h:130
size_t base64_encode(char out[], const uint8_t in[], size_t input_length, size_t &input_consumed, bool final_inputs)
Definition base64.cpp:159
size_t base_encode(const Base &base, char output[], const uint8_t input[], size_t input_length, size_t &input_consumed, bool final_inputs)
Definition codec_base.h:35
size_t base64_decode(uint8_t out[], const char in[], size_t input_length, size_t &input_consumed, bool final_inputs, bool ignore_ws)
Definition base64.cpp:167
size_t base_decode(const Base &base, uint8_t output[], const char input[], size_t input_length, size_t &input_consumed, bool final_inputs, bool ignore_ws=true)
Definition codec_base.h:118
size_t base64_encode_max_output(size_t input_length)
Definition base64.cpp:195
size_t base64_decode_max_output(size_t input_length)
Definition base64.cpp:199
std::vector< T, secure_allocator< T > > secure_vector
Definition secmem.h:69
Vector base_decode_to_vec(const Base &base, const char input[], size_t input_length, bool ignore_ws)
Definition codec_base.h:190
size_t base_decode_full(const Base &base, uint8_t output[], const char input[], size_t input_length, bool ignore_ws)
Definition codec_base.h:178