Botan 3.10.0
Crypto and TLS for C&
hex.cpp
Go to the documentation of this file.
1/*
2* Hex Encoding and Decoding
3* (C) 2010,2020 Jack Lloyd
4*
5* Botan is released under the Simplified BSD License (see license.txt)
6*/
7
8#include <botan/hex.h>
9
10#include <botan/exceptn.h>
11#include <botan/mem_ops.h>
12#include <botan/internal/charset.h>
13#include <botan/internal/fmt.h>
14#include <botan/internal/int_utils.h>
15#include <botan/internal/loadstor.h>
16
17namespace Botan {
18
19namespace {
20
21uint16_t hex_encode_2nibble(uint8_t n8, bool uppercase) {
22 // Offset for upper or lower case 'a' resp
23 const uint16_t a_mask = uppercase ? 0x0707 : 0x2727;
24
25 const uint16_t n = (static_cast<uint16_t>(n8 & 0xF0) << 4) | (n8 & 0x0F);
26 // n >= 10? If so add offset
27 const uint16_t diff = swar_lt<uint16_t>(0x0909, n) & a_mask;
28 // Can't overflow between bytes, so don't need explicit SWAR addition:
29 return n + 0x3030 + diff;
30}
31
32} // namespace
33
34void hex_encode(char output[], const uint8_t input[], size_t input_length, bool uppercase) {
35 for(size_t i = 0; i != input_length; ++i) {
36 const uint16_t h = hex_encode_2nibble(input[i], uppercase);
37 output[2 * i] = get_byte<0>(h);
38 output[2 * i + 1] = get_byte<1>(h);
39 }
40}
41
42std::string hex_encode(const uint8_t input[], size_t input_length, bool uppercase) {
43 std::string output(2 * input_length, 0);
44
45 if(input_length > 0) {
46 hex_encode(&output.front(), input, input_length, uppercase);
47 }
48
49 return output;
50}
51
52namespace {
53
54uint8_t hex_char_to_bin(char input) {
55 // Starts of valid value ranges (v_lo) and their lengths (v_range)
56 constexpr uint64_t v_lo = make_uint64(0, '0', 'a', 'A', ' ', '\n', '\t', '\r');
57 constexpr uint64_t v_range = make_uint64(0, 10, 6, 6, 1, 1, 1, 1);
58
59 const uint8_t x = static_cast<uint8_t>(input);
60 const uint64_t x8 = x * 0x0101010101010101;
61
62 const uint64_t v_mask = swar_in_range<uint64_t>(x8, v_lo, v_range) ^ 0x8000000000000000;
63
64 // This is the offset added to x to get the value we need
65 const uint64_t val_v = 0xd0a9c960767773 ^ static_cast<uint64_t>(0xFF - x) << 56;
66
67 return x + static_cast<uint8_t>(val_v >> (8 * index_of_first_set_byte(v_mask)));
68}
69
70} // namespace
71
72size_t hex_decode(uint8_t output[], const char input[], size_t input_length, size_t& input_consumed, bool ignore_ws) {
73 uint8_t* out_ptr = output;
74 bool top_nibble = true;
75
76 clear_mem(output, input_length / 2);
77
78 for(size_t i = 0; i != input_length; ++i) {
79 const uint8_t bin = hex_char_to_bin(input[i]);
80
81 if(bin >= 0x10) {
82 if(bin == 0x80 && ignore_ws) {
83 continue;
84 }
85
86 throw Invalid_Argument(fmt("hex_decode: invalid character '{}'", format_char_for_display(input[i])));
87 }
88
89 if(top_nibble) {
90 *out_ptr |= bin << 4;
91 } else {
92 *out_ptr |= bin;
93 }
94
95 top_nibble = !top_nibble;
96 if(top_nibble) {
97 ++out_ptr;
98 }
99 }
100
101 input_consumed = input_length;
102 size_t written = (out_ptr - output);
103
104 /*
105 * We only got half of a uint8_t at the end; zap the half-written
106 * output and mark it as unread
107 */
108 if(!top_nibble) {
109 *out_ptr = 0;
110 input_consumed -= 1;
111 }
112
113 return written;
114}
115
116size_t hex_decode(uint8_t output[], const char input[], size_t input_length, bool ignore_ws) {
117 size_t consumed = 0;
118 size_t written = hex_decode(output, input, input_length, consumed, ignore_ws);
119
120 if(consumed != input_length) {
121 throw Invalid_Argument("hex_decode: input did not have full bytes");
122 }
123
124 return written;
125}
126
127size_t hex_decode(uint8_t output[], std::string_view input, bool ignore_ws) {
128 return hex_decode(output, input.data(), input.length(), ignore_ws);
129}
130
131size_t hex_decode(std::span<uint8_t> output, std::string_view input, bool ignore_ws) {
132 return hex_decode(output.data(), input.data(), input.length(), ignore_ws);
133}
134
135secure_vector<uint8_t> hex_decode_locked(const char input[], size_t input_length, bool ignore_ws) {
136 secure_vector<uint8_t> bin(1 + input_length / 2);
137
138 size_t written = hex_decode(bin.data(), input, input_length, ignore_ws);
139
140 bin.resize(written);
141 return bin;
142}
143
144secure_vector<uint8_t> hex_decode_locked(std::string_view input, bool ignore_ws) {
145 return hex_decode_locked(input.data(), input.size(), ignore_ws);
146}
147
148std::vector<uint8_t> hex_decode(const char input[], size_t input_length, bool ignore_ws) {
149 std::vector<uint8_t> bin(1 + input_length / 2);
150
151 size_t written = hex_decode(bin.data(), input, input_length, ignore_ws);
152
153 bin.resize(written);
154 return bin;
155}
156
157std::vector<uint8_t> hex_decode(std::string_view input, bool ignore_ws) {
158 return hex_decode(input.data(), input.size(), ignore_ws);
159}
160
161} // namespace Botan
constexpr uint8_t get_byte(T input)
Definition loadstor.h:79
std::string format_char_for_display(char c)
Definition charset.cpp:98
constexpr T swar_lt(T a, T b)
Definition int_utils.h:91
constexpr auto out_ptr(T &outptr) noexcept
Definition stl_util.h:414
constexpr uint64_t make_uint64(uint8_t i0, uint8_t i1, uint8_t i2, uint8_t i3, uint8_t i4, uint8_t i5, uint8_t i6, uint8_t i7)
Definition loadstor.h:121
std::string fmt(std::string_view format, const T &... args)
Definition fmt.h:53
constexpr T swar_in_range(T v, T lower, T upper)
Definition int_utils.h:114
secure_vector< uint8_t > hex_decode_locked(const char input[], size_t input_length, bool ignore_ws)
Definition hex.cpp:135
constexpr size_t index_of_first_set_byte(T v)
Definition int_utils.h:130
void hex_encode(char output[], const uint8_t input[], size_t input_length, bool uppercase)
Definition hex.cpp:34
size_t hex_decode(uint8_t output[], const char input[], size_t input_length, size_t &input_consumed, bool ignore_ws)
Definition hex.cpp:72
std::vector< T, secure_allocator< T > > secure_vector
Definition secmem.h:69
constexpr void clear_mem(T *ptr, size_t n)
Definition mem_ops.h:119