| /* hex.c - conversion for hexadecimal and base32 strings. |
| * |
| * Copyright (c) 2008, Aleksey Kravchenko <rhash.admin@gmail.com> |
| * |
| * Permission to use, copy, modify, and/or distribute this software for any |
| * purpose with or without fee is hereby granted. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH |
| * REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY |
| * AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, |
| * INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM |
| * LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE |
| * OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR |
| * PERFORMANCE OF THIS SOFTWARE. |
| */ |
| #include "hex.h" |
| #include "util.h" |
| #include <ctype.h> |
| #include <string.h> |
| |
| /** |
| * Store hexadecimal representation of a binary string to given buffer. |
| * |
| * @param dst the buffer to receive hexadecimal representation |
| * @param src binary string |
| * @param length string length |
| * @param upper_case flag to print string in uppercase |
| */ |
| void rhash_byte_to_hex(char* dst, const unsigned char* src, size_t length, int upper_case) |
| { |
| const char hex_add = (upper_case ? 'A' - 10 : 'a' - 10); |
| for (; length > 0; src++, length--) { |
| const unsigned char hi = (*src >> 4) & 15; |
| const unsigned char lo = *src & 15; |
| *dst++ = (hi > 9 ? hi + hex_add : hi + '0'); |
| *dst++ = (lo > 9 ? lo + hex_add : lo + '0'); |
| } |
| *dst = '\0'; |
| } |
| |
| /** |
| * Encode a binary string to base32. |
| * |
| * @param dst the buffer to store result |
| * @param src binary string |
| * @param length string length |
| * @param upper_case flag to print string in uppercase |
| */ |
| void rhash_byte_to_base32(char* dst, const unsigned char* src, size_t length, int upper_case) |
| { |
| const char a = (upper_case ? 'A' : 'a'); |
| unsigned shift = 0; |
| unsigned char word; |
| const unsigned char* e = src + length; |
| while (src < e) { |
| if (shift > 3) { |
| word = (*src & (0xFF >> shift)); |
| shift = (shift + 5) % 8; |
| word <<= shift; |
| if (src + 1 < e) |
| word |= *(src + 1) >> (8 - shift); |
| ++src; |
| } else { |
| shift = (shift + 5) % 8; |
| word = ( *src >> ( (8 - shift) & 7 ) ) & 0x1F; |
| if (shift == 0) src++; |
| } |
| *dst++ = ( word < 26 ? word + a : word + '2' - 26 ); |
| } |
| *dst = '\0'; |
| } |
| |
| /** |
| * Encode a binary string to base64. |
| * Encoded output length is always a multiple of 4 bytes. |
| * |
| * @param dst the buffer to store result |
| * @param src binary string |
| * @param length string length |
| */ |
| void rhash_byte_to_base64(char* dst, const unsigned char* src, size_t length) |
| { |
| static const char* tail = "0123456789+/"; |
| unsigned shift = 0; |
| unsigned char word; |
| const unsigned char* e = src + length; |
| while (src < e) { |
| if (shift > 2) { |
| word = (*src & (0xFF >> shift)); |
| shift = (shift + 6) % 8; |
| word <<= shift; |
| if (src + 1 < e) |
| word |= *(src + 1) >> (8 - shift); |
| ++src; |
| } else { |
| shift = (shift + 6) % 8; |
| word = ( *src >> ( (8 - shift) & 7 ) ) & 0x3F; |
| if (shift == 0) src++; |
| } |
| *dst++ = ( word < 52 ? (word < 26 ? word + 'A' : word - 26 + 'a') : tail[word - 52]); |
| } |
| if (shift > 0) { |
| *dst++ = '='; |
| if (shift == 4) *dst++ = '='; |
| } |
| *dst = '\0'; |
| } |
| |
| size_t rhash_base64_url_encoded_helper(char* dst, const unsigned char* src, size_t length, int url_encode, int upper_case) |
| { |
| #define B64_CHUNK_SIZE 120 |
| char buffer[164]; |
| #ifdef __clang_analyzer__ |
| memset(buffer, 0, sizeof(buffer)); |
| #endif |
| RHASH_ASSERT((BASE64_LENGTH(B64_CHUNK_SIZE) + 4) <= sizeof(buffer)); |
| RHASH_ASSERT((B64_CHUNK_SIZE % 6) == 0); |
| if (url_encode) { |
| size_t result_length = 0; |
| for (; length > 0; src += B64_CHUNK_SIZE) { |
| size_t chunk_size = (length < B64_CHUNK_SIZE ? length : B64_CHUNK_SIZE); |
| size_t encoded_length; |
| rhash_byte_to_base64(buffer, src, chunk_size); |
| encoded_length = rhash_urlencode(dst, buffer, BASE64_LENGTH(chunk_size), upper_case); |
| result_length += encoded_length; |
| dst += encoded_length; |
| length -= chunk_size; |
| } |
| return result_length; |
| } |
| rhash_byte_to_base64(dst, src, length); |
| return BASE64_LENGTH(length); |
| } |
| |
| /* RFC 3986: safe url characters are ascii alpha-numeric and "-._~", other characters should be percent-encoded */ |
| static unsigned url_safe_char_mask[4] = { 0, 0x03ff6000, 0x87fffffe, 0x47fffffe }; |
| #define IS_URL_GOOD_CHAR(c) ((unsigned)(c) < 128 && (url_safe_char_mask[c >> 5] & (1 << (c & 31)))) |
| |
| /** |
| * URL-encode specified binary string. |
| * |
| * @param dst (nullable) buffer to output encoded string to, |
| * NULL to just calculate the lengths of encoded string |
| * @param src binary string to encode |
| * @param size size of the binary string |
| * @param upper_case flag to output hex-codes in uppercase |
| * @return the length of the result string |
| */ |
| size_t rhash_urlencode(char* dst, const char* src, size_t size, int upper_case) |
| { |
| const char* start; |
| size_t i; |
| if (!dst) { |
| size_t length = size; |
| for (i = 0; i < size; i++) |
| if (!IS_URL_GOOD_CHAR(src[i])) |
| length += 2; |
| return length; |
| } else { |
| const char hex_add = (upper_case ? 'A' - 10 : 'a' - 10); |
| start = dst; |
| /* percent-encode all but unreserved URL characters */ |
| for (i = 0; i < size; i++) { |
| if (IS_URL_GOOD_CHAR(src[i])) { |
| *dst++ = src[i]; |
| } else { |
| unsigned char hi = ((unsigned char)(src[i]) >> 4) & 0x0f; |
| unsigned char lo = (unsigned char)(src[i]) & 0x0f; |
| *dst++ = '%'; |
| *dst++ = (hi > 9 ? hi + hex_add : hi + '0'); |
| *dst++ = (lo > 9 ? lo + hex_add : lo + '0'); |
| } |
| } |
| *dst = 0; |
| } |
| return dst - start; |
| } |
| |
| /** |
| * Print 64-bit number with trailing '\0' to a string buffer. |
| * if dst is NULL, then just return the length of the number. |
| * |
| * @param dst output buffer |
| * @param number the number to print |
| * @return length of the printed number (without trailing '\0') |
| */ |
| int rhash_sprintI64(char* dst, uint64_t number) |
| { |
| /* The biggest number has 20 digits: 2^64 = 18 446 744 073 709 551 616 */ |
| char buf[24]; |
| char* p; |
| size_t length; |
| |
| if (dst == NULL) { |
| /* just calculate the length of the number */ |
| if (number == 0) return 1; |
| for (length = 0; number != 0; number /= 10) length++; |
| return (int)length; |
| } |
| |
| p = buf + 23; |
| *p = '\0'; /* last symbol should be '\0' */ |
| if (number == 0) { |
| *(--p) = '0'; |
| } else { |
| for (; p >= buf && number != 0; number /= 10) { |
| *(--p) = '0' + (char)(number % 10); |
| } |
| } |
| length = buf + 23 - p; |
| memcpy(dst, p, length + 1); |
| return (int)length; |
| } |