HikoGUI
A low latency retained GUI
Loading...
Searching...
No Matches
BON8.hpp
1// Copyright Take Vos 2020-2021.
2// Distributed under the Boost Software License, Version 1.0.
3// (See accompanying file LICENSE_1_0.txt or copy at https://www.boost.org/LICENSE_1_0.txt)
4
5#pragma once
6
7#include "../byte_string.hpp"
8#include "../required.hpp"
9#include "../datum.hpp"
10#include "../exception.hpp"
11#include "../cast.hpp"
12#include <cstddef>
13#include <string>
14
15namespace hi::inline v1 {
16namespace detail {
// Arrays holding 0 to 4 items carry their item count in the code itself;
// BON8_code_array starts an array that is closed by BON8_code_eoc.
constexpr uint8_t BON8_code_array_count0{0x80};
constexpr uint8_t BON8_code_array_count1{0x81};
constexpr uint8_t BON8_code_array_count2{0x82};
constexpr uint8_t BON8_code_array_count3{0x83};
constexpr uint8_t BON8_code_array_count4{0x84};
constexpr uint8_t BON8_code_array{0x85};

// Objects follow the same scheme as arrays.
constexpr uint8_t BON8_code_object_count0{0x86};
constexpr uint8_t BON8_code_object_count1{0x87};
constexpr uint8_t BON8_code_object_count2{0x88};
constexpr uint8_t BON8_code_object_count3{0x89};
constexpr uint8_t BON8_code_object_count4{0x8a};
constexpr uint8_t BON8_code_object{0x8b};

// Fixed-width numbers; the payload follows the code in big-endian byte order.
constexpr uint8_t BON8_code_int32{0x8c};
constexpr uint8_t BON8_code_int64{0x8d};
constexpr uint8_t BON8_code_binary32{0x8e};
constexpr uint8_t BON8_code_binary64{0x8f};

// Single-byte integers: first (_s) and last (_e) code of the positive
// range (values 0..39) and of the negative range (values -1..-10).
constexpr uint8_t BON8_code_positive_s{0x90};
constexpr uint8_t BON8_code_positive_e{0xb7};
constexpr uint8_t BON8_code_negative_s{0xb8};
constexpr uint8_t BON8_code_negative_e{0xc1};

// The last 8 code-units after the extended characters.
constexpr uint8_t BON8_code_bool_false{0xf8};
constexpr uint8_t BON8_code_bool_true{0xf9};
constexpr uint8_t BON8_code_null{0xfa};
constexpr uint8_t BON8_code_float_min_one{0xfb};
constexpr uint8_t BON8_code_float_zero{0xfc};
constexpr uint8_t BON8_code_float_one{0xfd};
constexpr uint8_t BON8_code_eoc{0xfe};
constexpr uint8_t BON8_code_eot{0xff};
47
54[[nodiscard]] datum decode_BON8(cbyteptr &ptr, cbyteptr last);
55
56[[nodiscard]] bstring encode_BON8(datum const &value);
57
61 bool open_string;
62 bstring output;
63
64public:
65 BON8_encoder() noexcept : open_string(false), output() {}
66
69 bstring const &get() noexcept
70 {
71 if (open_string) {
72 output += static_cast<std::byte>(BON8_code_eot);
73 open_string = false;
74 }
75 return output;
76 }
77
81 void add(signed long long value) noexcept
82 {
83 open_string = false;
84
86 output += static_cast<std::byte>(BON8_code_int64);
87 for (int i = 0; i != 8; ++i) {
88 output += static_cast<std::byte>(value >> (56 - i * 8));
89 }
90
91 } else if (value <= -33818507) {
92 output += static_cast<std::byte>(BON8_code_int32);
93 for (int i = 0; i != 4; ++i) {
94 output += static_cast<std::byte>(value >> (24 - i * 8));
95 }
96
97 } else if (value <= -264075) {
98 value = -(value + 264075);
99 output += static_cast<std::byte>(0xf0 + (value >> 22 & 0x07));
100 output += static_cast<std::byte>(0xc0 + (value >> 16 & 0x3f));
101 output += static_cast<std::byte>(value >> 8);
102 output += static_cast<std::byte>(value);
103
104 } else if (value <= -1931) {
105 value = -(value + 1931);
106 output += static_cast<std::byte>(0xe0 + (value >> 14 & 0x0f));
107 output += static_cast<std::byte>(0xc0 + (value >> 8 & 0x3f));
108 output += static_cast<std::byte>(value);
109
110 } else if (value <= -11) {
111 value = -(value + 11);
112 output += static_cast<std::byte>(0xc2 + (value >> 6 & 0x1f));
113 output += static_cast<std::byte>(0xc0 + (value & 0x3f));
114
115 } else if (value <= -1) {
116 value = -(value + 1);
117 output += static_cast<std::byte>(BON8_code_negative_s + value);
118
119 } else if (value <= 39) {
120 output += static_cast<std::byte>(BON8_code_positive_s + value);
121
122 } else if (value <= 3879) {
123 value -= 40;
124 output += static_cast<std::byte>(0xc2 + (value >> 7 & 0x1f));
125 output += static_cast<std::byte>(value & 0x7f);
126
127 } else if (value <= 528167) {
128 value -= 3880;
129 output += static_cast<std::byte>(0xe0 + (value >> 15 & 0x0f));
130 output += static_cast<std::byte>(value >> 8 & 0x7f);
131 output += static_cast<std::byte>(value);
132
133 } else if (value <= 67637031) {
134 value -= 528168;
135 output += static_cast<std::byte>(0xf0 + (value >> 23 & 0x17));
136 output += static_cast<std::byte>(value >> 16 & 0x7f);
137 output += static_cast<std::byte>(value >> 8);
138 output += static_cast<std::byte>(value);
139
140 } else if (value <= std::numeric_limits<int32_t>::max()) {
141 output += static_cast<std::byte>(BON8_code_int32);
142 for (int i = 0; i != 4; ++i) {
143 output += static_cast<std::byte>(value >> (24 - i * 8));
144 }
145
146 } else {
147 output += static_cast<std::byte>(BON8_code_int64);
148 for (int i = 0; i != 8; ++i) {
149 output += static_cast<std::byte>(value >> (56 - i * 8));
150 }
151 }
152 }
153
157 void add(unsigned long long value) noexcept
158 {
159 return add(narrow_cast<signed long long>(value));
160 }
161
165 void add(signed long value) noexcept
166 {
167 return add(narrow_cast<signed long long>(value));
168 }
169
173 void add(unsigned long value) noexcept
174 {
175 return add(narrow_cast<signed long long>(value));
176 }
177
181 void add(signed int value) noexcept
182 {
183 return add(narrow_cast<signed long long>(value));
184 }
185
189 void add(unsigned int value) noexcept
190 {
191 return add(narrow_cast<signed long long>(value));
192 }
193
197 void add(signed short value) noexcept
198 {
199 return add(narrow_cast<signed long long>(value));
200 }
201
205 void add(unsigned short value) noexcept
206 {
207 return add(narrow_cast<signed long long>(value));
208 }
209
213 void add(signed char value) noexcept
214 {
215 return add(narrow_cast<signed long long>(value));
216 }
217
221 void add(unsigned char value) noexcept
222 {
223 return add(narrow_cast<signed long long>(value));
224 }
225
229 void add(double value) noexcept
230 {
231 open_string = false;
232
233 hilet f32 = static_cast<float>(value);
234 hilet f32_64 = static_cast<double>(f32);
235
236 if (value == -1.0) {
237 output += static_cast<std::byte>(BON8_code_float_min_one);
238
239 } else if (value == 0.0 and not std::signbit(value)) {
240 output += static_cast<std::byte>(BON8_code_float_zero);
241
242 } else if (value == 1.0) {
243 output += static_cast<std::byte>(BON8_code_float_one);
244
245 } else if (f32_64 == value) {
246 // After conversion to 32-bit float, precession was not reduced.
247 uint32_t u32;
248 std::memcpy(&u32, &f32, sizeof(u32));
249
250 output += static_cast<std::byte>(BON8_code_binary32);
251 for (int i = 0; i != 4; ++i) {
252 output += static_cast<std::byte>(u32 >> (24 - i * 8));
253 }
254
255 } else {
256 uint64_t u64;
257 std::memcpy(&u64, &value, sizeof(u64));
258
259 output += static_cast<std::byte>(BON8_code_binary64);
260 for (int i = 0; i != 8; ++i) {
261 output += static_cast<std::byte>(u64 >> (56 - i * 8));
262 }
263 }
264 }
265
/** Add a floating point number.
 * @param value The floating point number to encode; it is widened to `double` first.
 */
void add(float value) noexcept
{
    auto const widened = static_cast<double>(value);
    add(widened);
}
273
277 void add(bool value) noexcept
278 {
279 open_string = false;
280 output += static_cast<std::byte>(value ? BON8_code_bool_true : BON8_code_bool_false);
281 }
282
286 void add(nullptr_t value) noexcept
287 {
288 open_string = false;
289 output += static_cast<std::byte>(BON8_code_null);
290 }
291
297 void add(std::string_view value) noexcept
298 {
299 if (open_string) {
300 output += static_cast<std::byte>(BON8_code_eot);
301 }
302
303 if (value.empty()) {
304 output += static_cast<std::byte>(BON8_code_eot);
305 open_string = false;
306
307 } else {
308 int multi_byte = 0;
309
310 for (hilet _c : value) {
311 hilet c = static_cast<uint8_t>(_c);
312
313 if constexpr (build_type::current == build_type::debug) {
314 if (multi_byte == 0) {
315 if (c >= 0xc2 and c <= 0xdf) {
316 multi_byte = 1;
317 } else if (c >= 0xe0 and c <= 0xef) {
318 multi_byte = 2;
319 } else if (c >= 0xf0 and c <= 0xf7) {
320 multi_byte = 3;
321 } else {
322 hi_assert(c <= 0x7f);
323 }
324
325 } else {
326 hi_assert(c >= 0x80 and c <= 0xbf);
327 --multi_byte;
328 }
329 }
330
331 output += static_cast<std::byte>(c);
332 }
333 hi_axiom(multi_byte == 0);
334
335 open_string = true;
336 }
337 }
338
344 void add(std::string const &value) noexcept
345 {
346 add(std::string_view{value});
347 }
348
354 void add(char const *value) noexcept
355 {
356 add(std::string_view{value});
357 }
358
362 void add(datum const &value);
363
368 template<typename T>
369 void add(std::vector<T> const &items)
370 {
371 open_string = false;
372 if (size(items) <= 4) {
373 output += static_cast<std::byte>(BON8_code_array_count0 + size(items));
374 } else {
375 output += static_cast<std::byte>(BON8_code_array);
376 }
377
378 for (hilet &item : items) {
379 add(item);
380 }
381
382 if (size(items) > 4) {
383 output += static_cast<std::byte>(BON8_code_eoc);
384 open_string = false;
385 }
386 }
387
393 template<typename Key, typename Value>
394 void add(std::map<Key, Value> const &items)
395 {
396 using key_type = typename std::remove_cvref_t<decltype(items)>::key_type;
397
398 open_string = false;
399 if (size(items) <= 4) {
400 output += static_cast<std::byte>(BON8_code_object_count0 + size(items));
401 } else {
402 output += static_cast<std::byte>(BON8_code_object);
403 }
404
405 for (hilet &item : items) {
406 if (auto *s = get_if<std::string>(item.first)) {
407 add(*s);
408 } else {
409 throw operation_error("BON8 object keys must be strings");
410 }
411 add(item.second);
412 }
413
414 if (size(items) > 4) {
415 output += static_cast<std::byte>(BON8_code_eoc);
416 open_string = false;
417 }
418 }
419};
420
421void BON8_encoder::add(datum const &value)
422{
423 if (auto s = get_if<std::string>(value)) {
424 add(*s);
425 } else if (auto u = get_if<URL>(value)) {
426 add(to_string(*u));
427 } else if (auto b = get_if<bool>(value)) {
428 add(*b);
429 } else if (holds_alternative<nullptr_t>(value)) {
430 add(nullptr);
431 } else if (auto i = get_if<long long>(value)) {
432 add(*i);
433 } else if (auto f = get_if<double>(value)) {
434 add(*f);
435 } else if (auto v = get_if<datum::vector_type>(value)) {
436 add(*v);
437 } else if (auto m = get_if<datum::map_type>(value)) {
438 add(*m);
439 } else {
440 throw operation_error("Datum value can not be encoded to BON8");
441 }
442}
443
452[[nodiscard]] int BON8_multibyte_count(cbyteptr ptr, cbyteptr last)
453{
454 hilet c0 = static_cast<uint8_t>(*ptr);
455 int count = c0 <= 0xdf ? 2 : c0 <= 0xef ? 3 : 4;
456
457 hi_parse_check(ptr + count <= last, "Incomplete Multi-byte character at end of buffer");
458
459 hilet c1 = static_cast<uint8_t>(*(ptr + 1));
460 return (c1 < 0x80 or c1 > 0xbf) ? -count : count;
461}
462
471[[nodiscard]] datum decode_BON8_int(cbyteptr &ptr, cbyteptr last, int count)
472{
473 hi_axiom(count == 4 || count == 8);
474
475 auto u64 = uint64_t{0};
476 for (int i = 0; i != count; ++i) {
477 hi_parse_check(ptr != last, "Incomplete signed integer at end of buffer");
478 u64 <<= 8;
479 u64 |= static_cast<uint64_t>(*(ptr++));
480 }
481
482 if (count == 4) {
483 hilet u32 = static_cast<uint32_t>(u64);
484 hilet i32 = static_cast<int32_t>(u32);
485 return datum{i32};
486 } else {
487 hilet i64 = static_cast<int64_t>(u64);
488 return datum{i64};
489 }
490}
491
492[[nodiscard]] datum decode_BON8_float(cbyteptr &ptr, cbyteptr last, int count)
493{
494 hi_axiom(count == 4 || count == 8);
495
496 auto u64 = uint64_t{0};
497 for (int i = 0; i != count; ++i) {
498 hi_parse_check(ptr != last, "Incomplete signed integer at end of buffer");
499 u64 <<= 8;
500 u64 |= static_cast<uint64_t>(*(ptr++));
501 }
502
503 if (count == 4) {
504 hilet u32 = static_cast<uint32_t>(u64);
505 float f32;
506 std::memcpy(&f32, &u32, sizeof(f32));
507 return datum{f32};
508
509 } else {
510 double f64;
511 std::memcpy(&f64, &u64, sizeof(f64));
512 return datum{f64};
513 }
514}
515
516[[nodiscard]] datum decode_BON8_array(cbyteptr &ptr, cbyteptr last)
517{
518 auto r = datum::make_vector();
519 auto &vector = get<datum::vector_type>(r);
520
521 while (ptr != last) {
522 if (*ptr == static_cast<std::byte>(BON8_code_eoc)) {
523 ++ptr;
524 return r;
525
526 } else {
527 vector.push_back(decode_BON8(ptr, last));
528 }
529 }
530 throw parse_error("Incomplete array at end of buffer");
531}
532
533[[nodiscard]] datum decode_BON8_array(cbyteptr &ptr, cbyteptr last, std::size_t count)
534{
535 auto r = datum::make_vector();
536 auto &vector = get<datum::vector_type>(r);
537
538 while (count--) {
539 vector.push_back(decode_BON8(ptr, last));
540 }
541 return r;
542}
543
544[[nodiscard]] datum decode_BON8_object(cbyteptr &ptr, cbyteptr last)
545{
546 auto r = datum::make_map();
547 auto &map = get<datum::map_type>(r);
548
549 while (ptr != last) {
550 if (*ptr == static_cast<std::byte>(BON8_code_eoc)) {
551 ++ptr;
552 return r;
553
554 } else {
555 auto key = decode_BON8(ptr, last);
556 hi_parse_check(holds_alternative<std::string>(key), "Key in object is not a string");
557
558 auto value = decode_BON8(ptr, last);
559 map.emplace(std::move(key), std::move(value));
560 }
561 }
562 throw parse_error("Incomplete object at end of buffer");
563}
564
565[[nodiscard]] datum decode_BON8_object(cbyteptr &ptr, cbyteptr last, std::size_t count)
566{
567 auto r = datum::make_map();
568 auto &map = get<datum::map_type>(r);
569
570 while (count--) {
571 auto key = decode_BON8(ptr, last);
572 hi_parse_check(holds_alternative<std::string>(key), "Key in object is not a string");
573
574 auto value = decode_BON8(ptr, last);
575 map.emplace(std::move(key), std::move(value));
576 }
577 return r;
578}
579
580[[nodiscard]] long long decode_BON8_UTF8_like_int(cbyteptr &ptr, cbyteptr last, int count) noexcept
581{
582 hi_axiom(count >= 2 && count <= 4);
583 hi_axiom(ptr != last);
584 hilet c0 = static_cast<uint8_t>(*(ptr++));
585
586 hilet mask = uint8_t{0b0111'1111} >> count;
587 auto value = static_cast<long long>(c0 & mask);
588 if (count == 2) {
589 // The two byte sequence starts with 0xc2, leaving only 30 entries in the first byte.
590 value -= 2;
591 }
592
593 // The second byte determines the sign, and adds 6 or 7 bits to the number.
594 hi_axiom(ptr != last);
595 hilet c1 = static_cast<uint8_t>(*(ptr++));
596 hilet is_positive = c1 <= 0x7f;
597 if (is_positive) {
598 value <<= 7;
599 value |= static_cast<long long>(c1);
600 } else {
601 value <<= 6;
602 value |= static_cast<long long>(c1 & 0b0011'1111);
603 }
604
605 switch (count) {
606 case 4:
607 hi_axiom(ptr != last);
608 value <<= 8;
609 value |= static_cast<int>(*(ptr++));
610 [[fallthrough]];
611 case 3:
612 hi_axiom(ptr != last);
613 value <<= 8;
614 value |= static_cast<int>(*(ptr++));
615 [[fallthrough]];
616 default:;
617 }
618
619 if (is_positive) {
620 switch (count) {
621 case 2: return value + 40;
622 case 3: return value + 3880;
623 case 4: return value + 528168;
624 default: hi_no_default();
625 }
626
627 } else {
628 switch (count) {
629 case 2: return -(value + 11);
630 case 3: return -(value + 1931);
631 case 4: return -(value + 264075);
632 default: hi_no_default();
633 }
634 }
635}
636
637[[nodiscard]] datum decode_BON8(cbyteptr &ptr, cbyteptr last)
638{
639 std::string str;
640
641 while (ptr != last) {
642 hilet c = static_cast<uint8_t>(*ptr);
643
644 if (c == BON8_code_eot) {
645 // End of string found, return the current string.
646 ++ptr;
647 return datum{str};
648
649 } else if (c <= 0x7f) {
650 // ASCII character.
651 str += static_cast<char>(*(ptr++));
652 continue;
653
654 } else if (c >= 0xc2 && c <= 0xf7) {
655 hilet count = BON8_multibyte_count(ptr, last);
656 if (count > 0) {
657 // Multibyte UTF-8 code-point, The count includes the first code-unit.
658 for (int i = 0; i != count; ++i) {
659 str += static_cast<char>(*(ptr++));
660 }
661 continue;
662
663 } else if (not str.empty()) {
664 // Multibyte integer found, but first return the current string.
665 return datum{str};
666
667 } else {
668 // Multibyte integer, the first code-unit includes part of the integer.
669 return datum{decode_BON8_UTF8_like_int(ptr, last, -count)};
670 }
671
672 } else if (not str.empty()) {
673 // This must be a non-string type, but first return the current string.
674 return datum{str};
675
676 } else {
677 // This is one of the non-string types.
678 ++ptr;
679 switch (c) {
680 case BON8_code_null: return datum{nullptr};
681 case BON8_code_bool_false: return datum{false};
682 case BON8_code_bool_true: return datum{true};
683 case BON8_code_float_min_one: return datum{-1.0f};
684 case BON8_code_float_zero: return datum{0.0f};
685 case BON8_code_float_one: return datum{1.0f};
686 case BON8_code_int32: return decode_BON8_int(ptr, last, 4);
687 case BON8_code_int64: return decode_BON8_int(ptr, last, 8);
688 case BON8_code_binary32: return decode_BON8_float(ptr, last, 4);
689 case BON8_code_binary64: return decode_BON8_float(ptr, last, 8);
690 case BON8_code_array_count0: return datum::make_vector();
691 case BON8_code_array_count1: return decode_BON8_array(ptr, last, 1);
692 case BON8_code_array_count2: return decode_BON8_array(ptr, last, 2);
693 case BON8_code_array_count3: return decode_BON8_array(ptr, last, 3);
694 case BON8_code_array_count4: return decode_BON8_array(ptr, last, 4);
695 case BON8_code_array: return decode_BON8_array(ptr, last);
696 case BON8_code_object_count0: return datum::make_map();
697 case BON8_code_object_count1: return decode_BON8_object(ptr, last, 1);
698 case BON8_code_object_count2: return decode_BON8_object(ptr, last, 2);
699 case BON8_code_object_count3: return decode_BON8_object(ptr, last, 3);
700 case BON8_code_object_count4: return decode_BON8_object(ptr, last, 4);
701 case BON8_code_object: return decode_BON8_object(ptr, last);
702 case BON8_code_eoc: throw parse_error("Unexpected end-of-container");
703 case BON8_code_eot: throw parse_error("Unexpected end-of-text");
704 default:
705 // Everything below this, are non-string types.
706 if (c >= BON8_code_positive_s and c <= BON8_code_positive_e) {
707 return datum{c - BON8_code_positive_s};
708
709 } else if (c >= BON8_code_negative_s and c <= BON8_code_negative_e) {
710 return datum{~static_cast<int>(c - BON8_code_negative_s)};
711
712 } else {
713 hi_no_default();
714 }
715 }
716 }
717 }
718 throw parse_error("Unexpected end-of-buffer");
719}
720} // namespace detail
721
726[[nodiscard]] datum decode_BON8(std::span<const std::byte> buffer)
727{
728 auto *ptr = buffer.data();
729 auto *last = ptr + buffer.size();
730 return detail::decode_BON8(ptr, last);
731}
732
737[[nodiscard]] datum decode_BON8(bstring const &buffer)
738{
739 auto *ptr = buffer.data();
740 auto *last = ptr + buffer.size();
741 return detail::decode_BON8(ptr, last);
742}
743
748[[nodiscard]] datum decode_BON8(bstring_view buffer)
749{
750 auto *ptr = buffer.data();
751 auto *last = ptr + buffer.size();
752 return detail::decode_BON8(ptr, last);
753}
754
759[[nodiscard]] bstring encode_BON8(datum const &value)
760{
761 auto encoder = detail::BON8_encoder{};
762 encoder.add(value);
763 return encoder.get();
764}
765
766} // namespace hi::inline v1
This file includes required definitions.
#define hilet
Invariant should be the default for variables.
Definition required.hpp:23
BON8 encoder.
Definition BON8.hpp:60
void add(std::string const &value) noexcept
Add a UTF-8 string.
Definition BON8.hpp:344
void add(double value) noexcept
Add a floating point number.
Definition BON8.hpp:229
void add(float value) noexcept
Add a floating point number.
Definition BON8.hpp:269
void add(unsigned long long value) noexcept
Add an unsigned integer.
Definition BON8.hpp:157
void add(nullptr_t value) noexcept
Add a null.
Definition BON8.hpp:286
void add(bool value) noexcept
Add a boolean.
Definition BON8.hpp:277
void add(signed long value) noexcept
Add a signed integer.
Definition BON8.hpp:165
void add(signed int value) noexcept
Add a signed integer.
Definition BON8.hpp:181
void add(signed short value) noexcept
Add a signed integer.
Definition BON8.hpp:197
void add(std::vector< T > const &items)
Add a vector of values of the same type.
Definition BON8.hpp:369
void add(unsigned int value) noexcept
Add an unsigned integer.
Definition BON8.hpp:189
void add(unsigned long value) noexcept
Add an unsigned integer.
Definition BON8.hpp:173
void add(char const *value) noexcept
Add a UTF-8 string.
Definition BON8.hpp:354
void add(signed char value) noexcept
Add a signed integer.
Definition BON8.hpp:213
void add(signed long long value) noexcept
Add a signed integer.
Definition BON8.hpp:81
bstring const & get() noexcept
Return a byte_string of the encoded object.
Definition BON8.hpp:69
void add(unsigned short value) noexcept
Add an unsigned integer.
Definition BON8.hpp:205
void add(unsigned char value) noexcept
Add an unsigned integer.
Definition BON8.hpp:221
void add(std::string_view value) noexcept
Add a UTF-8 string.
Definition BON8.hpp:297
void add(std::map< Key, Value > const &items)
Add a map of key/values pairs.
Definition BON8.hpp:394
A dynamic data type.
Definition datum.hpp:209
Exception thrown during execution of a dynamic operation.
Definition exception.hpp:37
T count(T... args)
T empty(T... args)
T memcpy(T... args)
T move(T... args)
T signbit(T... args)