HikoGUI
A low latency retained GUI
Loading...
Searching...
No Matches
text_shaper.hpp
1// Copyright Take Vos 2021-2022.
2// Distributed under the Boost Software License, Version 1.0.
3// (See accompanying file LICENSE_1_0.txt or copy at https://www.boost.org/LICENSE_1_0.txt)
4
5#pragma once
6
#include "text_shaper_char.hpp"
#include "text_shaper_line.hpp"
#include "text_cursor.hpp"
#include "text_style_set.hpp"
#include "../layout/layout.hpp"
#include "../font/font.hpp"
#include "../geometry/geometry.hpp"
#include "../unicode/unicode.hpp"
#include "../units/units.hpp"
#include "../macros.hpp"
#include <vector>
#include <tuple>
#include <limits>
#include <coroutine>
20
21hi_export_module(hikogui.text.text_shaper);
22
23hi_export namespace hi::inline v1 {
24
38class text_shaper {
39public:
40 using char_vector = std::vector<text_shaper_char>;
41 using char_iterator = char_vector::iterator;
42 using char_const_iterator = char_vector::const_iterator;
43 using char_reference = char_vector::reference;
44 using char_const_reference = char_vector::const_reference;
45 using line_vector = std::vector<text_shaper_line>;
46 using line_iterator = line_vector::iterator;
47 using line_const_iterator = line_vector::const_iterator;
48
49 constexpr text_shaper() noexcept = default;
50 constexpr text_shaper(text_shaper const&) noexcept = default;
51 constexpr text_shaper(text_shaper&&) noexcept = default;
52 constexpr text_shaper& operator=(text_shaper const&) noexcept = default;
53 constexpr text_shaper& operator=(text_shaper&&) noexcept = default;
54
83 [[nodiscard]] text_shaper(
84 gstring const& text,
85 text_style_set const& style,
86 unit::pixel_density pixel_density,
87 hi::alignment alignment,
88 bool left_to_right,
89 iso_15924 script = iso_15924{"Zyyy"}) noexcept :
90 _bidi_context(left_to_right ? unicode_bidi_class::L : unicode_bidi_class::R),
91 _pixel_density(pixel_density),
92 _alignment(alignment),
93 _script(script)
94 {
95 auto const font = style.front().font_chain()[0];
96 _initial_line_metrics = style.front().size() * _pixel_density * font->metrics;
97
98 _text.reserve(text.size());
99 for (auto const& c : text) {
100 auto const clean_c = c == '\n' ? grapheme{unicode_PS} : c;
101
102 auto& tmp = _text.emplace_back(clean_c, style, _pixel_density);
103 tmp.initialize_glyph(font);
104 }
105
106 _text_direction = unicode_bidi_direction(
107 _text.begin(),
108 _text.end(),
109 [](text_shaper::char_const_reference it) {
110 return it.grapheme.starter();
111 },
112 _bidi_context);
113
114 _line_break_opportunities = unicode_line_break(_text.begin(), _text.end(), [](auto const& c) -> decltype(auto) {
115 return c.grapheme.starter();
116 });
117
118 _line_break_widths.reserve(text.size());
119 for (auto const& c : _text) {
120 _line_break_widths.push_back(is_visible(c.general_category) ? c.width : -c.width);
121 }
122
123 _word_break_opportunities = unicode_word_break(_text.begin(), _text.end(), [](auto const& c) -> decltype(auto) {
124 return c.grapheme.starter();
125 });
126
127 _sentence_break_opportunities = unicode_sentence_break(_text.begin(), _text.end(), [](auto const& c) -> decltype(auto) {
128 return c.grapheme.starter();
129 });
130
131 resolve_script();
132 }
133
134 [[nodiscard]] text_shaper(
135 std::string_view text,
136 text_style_set const& style,
137 unit::pixel_density pixel_density,
138 hi::alignment alignment,
139 bool left_to_right,
140 iso_15924 script = iso_15924{"Zyyy"}) noexcept :
141 text_shaper(to_gstring(text), style, pixel_density, alignment, left_to_right, script)
142 {
143 }
144
145 [[nodiscard]] bool empty() const noexcept
146 {
147 return _text.empty();
148 }
149
150 [[nodiscard]] size_t size() const noexcept
151 {
152 return _text.size();
153 }
154
155 [[nodiscard]] char_iterator begin() noexcept
156 {
157 return _text.begin();
158 }
159
160 [[nodiscard]] char_const_iterator begin() const noexcept
161 {
162 return _text.begin();
163 }
164
165 [[nodiscard]] char_const_iterator cbegin() const noexcept
166 {
167 return _text.cbegin();
168 }
169
170 [[nodiscard]] char_iterator end() noexcept
171 {
172 return _text.end();
173 }
174
175 [[nodiscard]] char_const_iterator end() const noexcept
176 {
177 return _text.end();
178 }
179
180 [[nodiscard]] char_const_iterator cend() const noexcept
181 {
182 return _text.cend();
183 }
184
185 auto const& lines() const noexcept
186 {
187 return _lines;
188 }
189
206 [[nodiscard]] aarectangle
207 bounding_rectangle(float maximum_line_width) noexcept
208 {
209 auto const rectangle = aarectangle{
211 constexpr auto baseline = 0.0f;
212 constexpr auto sub_pixel_size = extent2{1.0f, 1.0f};
213
214 auto const lines = make_lines(rectangle, baseline, sub_pixel_size);
215 hi_assert(not lines.empty());
216
217 auto max_width = 0.0f;
218 for (auto& line : lines) {
219 inplace_max(max_width, line.width);
220 }
221
222 auto const max_y = lines.front().y + std::ceil(lines.front().metrics.ascender.in(unit::pixels));
223 auto const min_y = lines.back().y - std::ceil(lines.back().metrics.descender.in(unit::pixels));
224 return aarectangle{point2{0.0f, min_y}, point2{std::ceil(max_width), max_y}};
225 }
226
239 void layout(
240 aarectangle rectangle,
241 float baseline,
242 extent2 sub_pixel_size) noexcept
243 {
244 _rectangle = rectangle;
245 _lines = make_lines(rectangle, baseline, sub_pixel_size);
246 hi_assert(not _lines.empty());
247 position_glyphs(rectangle, sub_pixel_size);
248 }
249
252 [[nodiscard]] aarectangle rectangle() const noexcept
253 {
254 return _rectangle;
255 }
256
259 [[nodiscard]] unicode_bidi_class text_direction() const noexcept
260 {
261 return _text_direction;
262 }
263
269 [[nodiscard]] alignment resolved_alignment() const noexcept
270 {
271 return resolve(_alignment, _text_direction == unicode_bidi_class::L);
272 }
273
281 [[nodiscard]] char_const_iterator get_it(size_t index) const noexcept
282 {
283 if (static_cast<ptrdiff_t>(index) < 0) {
284 return begin();
285 } else if (index >= size()) {
286 return end();
287 }
288
289 return begin() + index;
290 }
291
299 [[nodiscard]] char_const_iterator get_it(text_cursor cursor) const noexcept
300 {
301 return get_it(cursor.index());
302 }
303
312 [[nodiscard]] char_const_iterator get_it(size_t column_nr, size_t line_nr) const noexcept
313 {
314 hi_assert(not _lines.empty());
315
316 if (static_cast<ptrdiff_t>(line_nr) < 0) {
317 return begin();
318 } else if (line_nr >= _lines.size()) {
319 return end();
320 }
321
322 auto const left_of_line = static_cast<ptrdiff_t>(column_nr) < 0;
323 auto const right_of_line = column_nr >= _lines[line_nr].size();
324
325 if (left_of_line or right_of_line) {
326 auto const ltr = _lines[line_nr].paragraph_direction == unicode_bidi_class::L;
327 auto const go_up = left_of_line == ltr;
328 if (go_up) {
329 // Go to line above.
330 if (static_cast<ptrdiff_t>(--line_nr) < 0) {
331 return begin();
332 } else {
333 // Go to end of line above.
334 return _lines[line_nr].paragraph_direction == unicode_bidi_class::L ? _lines[line_nr].back() :
335 _lines[line_nr].front();
336 }
337
338 } else {
339 // Go to the line below.
340 if (++line_nr >= _lines.size()) {
341 return end();
342 } else {
343 // Go to begin of line below.
344 return _lines[line_nr].paragraph_direction == unicode_bidi_class::L ? _lines[line_nr].front() :
345 _lines[line_nr].back();
346 }
347 }
348 }
349
350 return _lines[line_nr][column_nr];
351 }
352
360 [[nodiscard]] char_const_iterator get_it(std::pair<size_t, size_t> column_row) const noexcept
361 {
362 return get_it(column_row.first, column_row.second);
363 }
364
370 [[nodiscard]] std::pair<size_t, size_t> get_column_line(text_shaper::char_const_iterator it) const noexcept
371 {
372 if (it != end()) {
373 return {it->column_nr, it->line_nr};
374 } else {
375 hi_assert(not _lines.empty());
376 return {_lines.size() - 1, _lines.back().size()};
377 }
378 }
379
385 [[nodiscard]] std::pair<size_t, size_t> get_column_line(size_t index) const noexcept
386 {
387 return get_column_line(get_it(index));
388 }
389
395 [[nodiscard]] std::pair<size_t, size_t> get_column_line(text_cursor cursor) const noexcept
396 {
397 return get_column_line(cursor.index());
398 }
399
405 [[nodiscard]] size_t get_index(text_shaper::char_const_iterator it) const noexcept
406 {
407 return narrow_cast<size_t>(std::distance(begin(), it));
408 }
409
414 [[nodiscard]] text_cursor get_begin_cursor() const noexcept
415 {
416 return {};
417 }
418
423 [[nodiscard]] text_cursor get_end_cursor() const noexcept
424 {
425 return text_cursor{size() - 1, true}.resize(size());
426 }
427
433 [[nodiscard]] text_cursor get_before_cursor(size_t index) const noexcept
434 {
435 return text_cursor{index, false}.resize(size());
436 }
437
443 [[nodiscard]] text_cursor get_after_cursor(size_t index) const noexcept
444 {
445 return text_cursor{index, true}.resize(size());
446 }
447
453 [[nodiscard]] text_cursor get_before_cursor(text_shaper::char_const_iterator it) const noexcept
454 {
455 return get_before_cursor(get_index(it));
456 }
457
463 [[nodiscard]] text_cursor get_after_cursor(text_shaper::char_const_iterator it) const noexcept
464 {
465 return get_after_cursor(get_index(it));
466 }
467
473 [[nodiscard]] text_cursor get_left_cursor(text_shaper::char_const_iterator it) const noexcept
474 {
475 if (it != end()) {
476 if (it->direction == unicode_bidi_class::L) {
477 return get_before_cursor(it);
478 } else {
479 return get_after_cursor(it);
480 }
481 } else {
482 return get_end_cursor();
483 }
484 }
485
491 [[nodiscard]] text_cursor get_right_cursor(text_shaper::char_const_iterator it) const noexcept
492 {
493 if (it != end()) {
494 if (it->direction == unicode_bidi_class::L) {
495 return get_after_cursor(it);
496 } else {
497 return get_before_cursor(it);
498 }
499 } else {
500 return get_end_cursor();
501 }
502 }
503
509 [[nodiscard]] bool is_on_left(text_cursor cursor) const noexcept
510 {
511 auto const it = get_it(cursor);
512 if (it != end()) {
513 return (it->direction == unicode_bidi_class::L) == cursor.before();
514 } else {
515 hi_assert(begin() == end());
516 return true;
517 }
518 }
519
525 [[nodiscard]] bool is_on_right(text_cursor cursor) const noexcept
526 {
527 auto const it = get_it(cursor);
528 if (it != end()) {
529 return (it->direction == unicode_bidi_class::L) == cursor.after();
530 } else {
531 hi_assert(begin() == end());
532 return true;
533 }
534 }
535
541 [[nodiscard]] text_cursor get_nearest_cursor(point2 position) const noexcept
542 {
543 if (_text.empty()) {
544 return {};
545 }
546
547 auto const line_it = std::ranges::min_element(_lines, std::ranges::less{}, [position](auto const& line) {
548 return std::abs(line.y - position.y());
549 });
550
551 if (line_it != _lines.end()) {
552 auto const[char_it, after] = line_it->get_nearest(position);
553 return {narrow_cast<size_t>(std::distance(_text.begin(), char_it)), after};
554 } else {
555 return {};
556 }
557 }
558
562 {
563 auto const index = cursor.index();
564 return {get_before_cursor(index), get_after_cursor(index)};
565 }
566
570 {
571 return get_selection_from_break(cursor, _word_break_opportunities);
572 }
573
577 {
578 return get_selection_from_break(cursor, _sentence_break_opportunities);
579 }
580
584 {
585 auto const first_index = [&]() {
586 auto i = cursor.index();
587 while (i > 0) {
588 if (_text[i - 1].general_category == unicode_general_category::Zp) {
589 return i;
590 }
591 --i;
592 }
593 return i;
594 }();
595 auto const last_index = [&]() {
596 auto i = cursor.index();
597 while (i < _text.size()) {
598 if (_text[i].general_category == unicode_general_category::Zp) {
599 return i;
600 }
601 ++i;
602 }
603 return i;
604 }();
605
606 return {get_before_cursor(first_index), get_after_cursor(last_index)};
607 }
608
612 {
613 if (_text.empty()) {
614 return {{}, {}};
615 }
616
617 return {{}, get_end_cursor()};
618 }
619
625 [[nodiscard]] char_const_iterator move_left_char(char_const_iterator it) const noexcept
626 {
627 auto const[column_nr, line_nr] = get_column_line(it);
628 return get_it(column_nr - 1, line_nr);
629 }
630
636 [[nodiscard]] char_const_iterator move_right_char(char_const_iterator it) const noexcept
637 {
638 auto const[column_nr, line_nr] = get_column_line(it);
639 return get_it(column_nr + 1, line_nr);
640 }
641
642 [[nodiscard]] text_cursor move_left_char(text_cursor cursor, bool overwrite_mode) const noexcept
643 {
644 auto it = get_it(cursor);
645 if (overwrite_mode) {
646 it = move_left_char(it);
647 return get_before_cursor(it);
648
649 } else {
650 if (is_on_left(cursor)) {
651 // If the cursor is on the left side of a character, then move one character left.
652 it = move_left_char(it);
653 }
654
655 return get_left_cursor(it);
656 }
657 }
658
659 [[nodiscard]] text_cursor move_right_char(text_cursor cursor, bool overwrite_mode) const noexcept
660 {
661 auto it = get_it(cursor);
662 if (overwrite_mode) {
663 it = move_right_char(it);
664 return get_before_cursor(it);
665
666 } else {
667 if (is_on_right(cursor)) {
668 // If the cursor is on the left side of a character, then move one character left.
669 it = move_right_char(it);
670 }
671
672 return get_right_cursor(it);
673 }
674 }
675
676 [[nodiscard]] text_cursor move_down_char(text_cursor cursor, float& x) const noexcept
677 {
678 if (_text.empty()) {
679 return {};
680 }
681
682 auto [column_nr, line_nr] = get_column_line(cursor);
683 if (++line_nr == _lines.size()) {
684 return get_end_cursor();
685 }
686
687 if (std::isnan(x)) {
688 auto const char_it = get_it(cursor);
689 hi_assert(char_it != _text.end());
690 x = is_on_left(cursor) ? char_it->rectangle.left() : char_it->rectangle.right();
691 }
692
693 auto const[new_char_it, after] = _lines[line_nr].get_nearest(point2{x, 0.0f});
694 return get_before_cursor(new_char_it);
695 }
696
697 [[nodiscard]] text_cursor move_up_char(text_cursor cursor, float& x) const noexcept
698 {
699 if (_text.empty()) {
700 return {};
701 }
702
703 auto [column_nr, line_nr] = get_column_line(cursor);
704 if (line_nr-- == 0) {
705 return {};
706 }
707
708 if (std::isnan(x)) {
709 auto char_it = get_it(cursor);
710 hi_assert(char_it < _text.end());
711 x = is_on_left(cursor) ? char_it->rectangle.left() : char_it->rectangle.right();
712 }
713
714 auto const[new_char_it, after] = _lines[line_nr].get_nearest(point2{x, 0.0f});
715 return get_before_cursor(new_char_it);
716 }
717
718 [[nodiscard]] text_cursor move_left_word(text_cursor cursor, bool overwrite_mode) const noexcept
719 {
720 cursor = move_left_char(cursor, overwrite_mode).before_neighbor(size());
721 auto it = get_it(cursor);
722 while (it != end()) {
723 if (it->general_category != unicode_general_category::Zs and
724 _word_break_opportunities[get_index(it)] != unicode_break_opportunity::no) {
725 return get_before_cursor(it);
726 }
727 it = move_left_char(it);
728 }
729 return get_end_cursor();
730 }
731
732 [[nodiscard]] text_cursor move_right_word(text_cursor cursor, bool overwrite_mode) const noexcept
733 {
734 cursor = move_right_char(cursor, overwrite_mode).before_neighbor(size());
735 auto it = get_it(cursor);
736 while (it != end()) {
737 if (it->general_category != unicode_general_category::Zs and
738 _word_break_opportunities[get_index(it)] != unicode_break_opportunity::no) {
739 return get_before_cursor(it);
740 }
741 it = move_right_char(it);
742 }
743 return get_end_cursor();
744 }
745
746 [[nodiscard]] text_cursor move_begin_line(text_cursor cursor) const noexcept
747 {
748 auto const[column_nr, line_nr] = get_column_line(cursor);
749 auto const& line = _lines[line_nr];
750 return get_before_cursor(line.first);
751 }
752
753 [[nodiscard]] text_cursor move_end_line(text_cursor cursor) const noexcept
754 {
755 auto const[column_nr, line_nr] = get_column_line(cursor);
756 auto const& line = _lines[line_nr];
757
758 auto it = line.last;
759 while (it != line.first) {
760 --it;
761 if (not it->is_trailing_white_space) {
762 break;
763 }
764 }
765
766 return get_after_cursor(it);
767 }
768
769 [[nodiscard]] text_cursor move_begin_sentence(text_cursor cursor) const noexcept
770 {
771 if (cursor.after()) {
772 cursor = {cursor.index(), false};
773 } else if (cursor.index() != 0) {
774 cursor = {cursor.index() - 1, false};
775 }
776 auto const[first, last] = select_sentence(cursor);
777 return first.before_neighbor(size());
778 }
779
780 [[nodiscard]] text_cursor move_end_sentence(text_cursor cursor) const noexcept
781 {
782 if (cursor.before()) {
783 cursor = {cursor.index(), true};
784 } else if (cursor.index() != _text.size() - 1) {
785 cursor = {cursor.index() + 1, true};
786 }
787 auto const[first, last] = select_sentence(cursor);
788 return last.before_neighbor(size());
789 }
790
791 [[nodiscard]] text_cursor move_begin_paragraph(text_cursor cursor) const noexcept
792 {
793 if (cursor.after()) {
794 cursor = {cursor.index(), false};
795 } else if (cursor.index() != 0) {
796 cursor = {cursor.index() - 1, false};
797 }
798 auto const[first, last] = select_paragraph(cursor);
799 return first.before_neighbor(size());
800 }
801
802 [[nodiscard]] text_cursor move_end_paragraph(text_cursor cursor) const noexcept
803 {
804 if (cursor.before()) {
805 cursor = {cursor.index(), true};
806 } else if (cursor.index() != _text.size() - 1) {
807 cursor = {cursor.index() + 1, true};
808 }
809 auto const[first, last] = select_paragraph(cursor);
810 return last.before_neighbor(size());
811 }
812
813 [[nodiscard]] text_cursor move_begin_document(text_cursor cursor) const noexcept
814 {
815 return {};
816 }
817
818 [[nodiscard]] text_cursor move_end_document(text_cursor cursor) const noexcept
819 {
820 if (_text.empty()) {
821 return {};
822 }
823
824 return get_end_cursor();
825 }
826
827private:
830 unit::pixel_density _pixel_density;
831
838 char_vector _text;
839
840 hi::alignment _alignment;
841
844 unicode_break_vector _line_break_opportunities;
845
848 std::vector<float> _line_break_widths;
849
852 unicode_break_vector _word_break_opportunities;
853
856 unicode_break_vector _sentence_break_opportunities;
857
860 unicode_bidi_context _bidi_context;
861
864 unicode_bidi_class _text_direction;
865
868 iso_15924 _script;
869
874 line_vector _lines;
875
878 font_metrics_px _initial_line_metrics;
879
882 aarectangle _rectangle;
883
884 static void
885 layout_lines_vertical_spacing(text_shaper::line_vector& lines) noexcept
886 {
887 hi_assert(not lines.empty());
888
889 auto prev = lines.begin();
890 prev->y = 0.0f;
891 for (auto it = prev + 1; it != lines.end(); ++it) {
892 auto const height =
893 prev->metrics.descender + std::max(prev->metrics.line_gap, it->metrics.line_gap) + it->metrics.ascender;
894
895 auto const line_spacing = std::max(prev->line_spacing, it->line_spacing);
896 auto const paragraph_spacing = std::max(prev->paragraph_spacing, it->paragraph_spacing);
897 auto const spacing = prev->last_category == unicode_general_category::Zp ? paragraph_spacing : line_spacing;
898 // Lines advance downward on the y-axis.
899 it->y = prev->y - spacing * height.in(unit::pixels);
900 prev = it;
901 }
902 }
903
904 static void layout_lines_vertical_alignment(
905 text_shaper::line_vector& lines,
906 vertical_alignment alignment,
907 float baseline,
908 float min_y,
909 float max_y,
910 float sub_pixel_height) noexcept
911 {
912 hi_assert(not lines.empty());
913
914 // Calculate the y-adjustment needed to position the base-line of the text to y=0
915 auto adjustment = [&]() {
916 if (alignment == vertical_alignment::top) {
917 return -lines.front().y;
918
919 } else if (alignment == vertical_alignment::bottom) {
920 return -lines.back().y;
921
922 } else {
923 auto const mp_index = lines.size() / 2;
924 if (lines.size() % 2 == 1) {
925 return -lines[mp_index].y;
926
927 } else {
928 return -std::midpoint(lines[mp_index - 1].y, lines[mp_index].y);
929 }
930 }
931 }();
932
933 // Add the base-line to the adjustment.
934 adjustment += baseline;
935
936 // Clamp the adjustment between min_y and max_y.
937 // The text may not fit, prioritize to show the top lines.
938 if (lines.back().y + adjustment < min_y) {
939 adjustment = min_y - lines.back().y;
940 }
941 if (lines.front().y + adjustment > max_y) {
942 adjustment = max_y - lines.front().y;
943 }
944
945 // Reposition the lines, and round to sub-pixel boundary.
946 auto const rcp_sub_pixel_height = 1.0f / sub_pixel_height;
947 for (auto& line : lines) {
948 line.y = std::round((line.y + adjustment) * rcp_sub_pixel_height) * sub_pixel_height;
949 }
950 }
951
958 static void
959 bidi_algorithm(text_shaper::line_vector& lines, text_shaper::char_vector& text, unicode_bidi_context bidi_context) noexcept
960 {
961 hi_assert(not lines.empty());
962
963 // Create a list of all character indices.
964 auto char_its = std::vector<text_shaper::char_iterator>{};
965 // Make room for implicit line-separators.
966 char_its.reserve(text.size() + lines.size());
967 for (auto const& line : lines) {
968 // Add all the characters of a line.
969 for (auto it = line.first; it != line.last; ++it) {
970 char_its.push_back(it);
971 }
972 if (not is_Zp_or_Zl(line.last_category)) {
973 // No explicit paragraph-separator or line-separator, at a virtual one.
974 char_its.push_back(text.end());
975 }
976 }
977
978 auto const[char_its_last, paragraph_directions] = unicode_bidi(
979 char_its.begin(),
980 char_its.end(),
981 [&](text_shaper::char_const_iterator it) {
982 if (it != text.end()) {
983 return it->grapheme.starter();
984 } else {
985 return unicode_LS;
986 }
987 },
988 [&](text_shaper::char_iterator it, char32_t code_point) {
989 hi_axiom(it != text.end());
990 it->replace_glyph(code_point);
991 },
992 [&](text_shaper::char_iterator it, unicode_bidi_class direction) {
993 if (it != text.end()) {
994 it->direction = direction;
995 }
996 },
997 bidi_context);
998
999 // The unicode bidi algorithm may have deleted a few characters.
1000 char_its.erase(char_its_last, char_its.cend());
1001
1002 // Add the paragraph direction for each line.
1003 auto par_it = paragraph_directions.cbegin();
1004 for (auto& line : lines) {
1005 hi_axiom(par_it != paragraph_directions.cend());
1006 line.paragraph_direction = *par_it;
1007 if (line.last_category == unicode_general_category::Zp) {
1008 par_it++;
1009 }
1010 }
1011 hi_assert(par_it <= paragraph_directions.cend());
1012
1013 // Add the character indices for each line in display order.
1014 auto line_it = lines.begin();
1015 line_it->columns.clear();
1016 auto column_nr = 0_uz;
1017 for (auto const char_it : char_its) {
1018 if (char_it == text.end()) {
1019 // Ignore the virtual line separators.
1020 continue;
1021 } else if (char_it >= line_it->last) {
1022 // Skip to the next line.
1023 hi_axiom(line_it->columns.size() <= narrow_cast<size_t>(std::distance(line_it->first, line_it->last)));
1024 ++line_it;
1025 line_it->columns.clear();
1026 column_nr = 0_uz;
1027 }
1028 hi_axiom(line_it != lines.end());
1029 hi_axiom(char_it >= line_it->first);
1030 hi_axiom(char_it < line_it->last);
1031 line_it->columns.push_back(char_it);
1032
1033 // Assign line_nr and column_nr, for quick back referencing.
1034 char_it->line_nr = line_it->line_nr;
1035 char_it->column_nr = column_nr++;
1036 }
1037
1038 // All of the characters in the text must be positioned.
1039 for (auto& c : text) {
1040 hi_axiom(c.line_nr != std::numeric_limits<size_t>::max() and c.column_nr != std::numeric_limits<size_t>::max());
1041 }
1042 }
1043
1044 [[nodiscard]] static generator<std::pair<std::vector<size_t>, float>>
1045 get_widths(unicode_break_vector const& opportunities, std::vector<float> const& widths, unit::pixel_density pixel_density) noexcept
1046 {
1047 struct entry_type {
1048 size_t min_height;
1049 size_t max_height;
1050 float min_width;
1051 float max_width;
1052 };
1053
1054 auto stack = std::vector<entry_type>{};
1055
1056 auto const a4_one_column = (au::milli(au::meters)(172.0f) * pixel_density.ppi).in(unit::pixels);
1057 auto const a4_two_column = (au::milli(au::meters)(88.0f) * pixel_density.ppi).in(unit::pixels);
1058
1059 // Max-width first.
1060 auto [max_width, max_lines] = detail::unicode_LB_maximum_width(opportunities, widths);
1061 auto height = max_lines.size();
1062 co_yield {std::move(max_lines), max_width};
1063
1064 if (max_width >= a4_two_column) {
1065 // If this is wide text, then only try a few sizes.
1066 if (max_width > a4_one_column) {
1067 auto [width, lines] = detail::unicode_LB_width(opportunities, widths, a4_one_column);
1068 if (std::exchange(height, lines.size()) > lines.size()) {
1069 co_yield {std::move(lines), width};
1070 }
1071 }
1072
1073 auto [width, lines] = detail::unicode_LB_width(opportunities, widths, a4_two_column);
1074 if (std::exchange(height, lines.size()) > lines.size()) {
1075 co_yield {std::move(lines), width};
1076 }
1077
1078 } else {
1079 // With small text we try every size that changes the number of lines.
1080 auto [min_width, min_lines] = detail::unicode_LB_minimum_width(opportunities, widths);
1081 if (min_lines.size() >= height) {
1082 // There are no multiple sizes.
1083 co_return;
1084 }
1085
1086 stack.emplace_back(min_lines.size(), height, min_width, max_width);
1087 co_yield {std::move(min_lines), min_width};
1088
1089 do {
1090 auto const entry = stack.back();
1091 stack.pop_back();
1092
1093 if (entry.max_height > entry.max_height + 1 and entry.max_width >= entry.min_width + 2.0f) {
1094 // There lines between the current two sizes; split in two.
1095 auto const half_width = (entry.min_width + entry.max_width) * 0.5f;
1096
1097 auto [split_width, split_lines] = detail::unicode_LB_width(opportunities, widths, half_width);
1098 auto const split_height = split_lines.size();
1099
1100 if (split_height == entry.min_height) {
1101 // We didn't find a proper split, need to try the upper half. Use `half_width` to split right down the
1102 // middle.
1103 stack.emplace_back(split_height, entry.max_height, half_width, entry.max_width);
1104
1105 } else if (split_height == entry.max_height) {
1106 // We didn't find a proper split, need to try the lower half. Use `half_width` to split right down the
1107 // middle.
1108 stack.emplace_back(entry.min_height, split_height, entry.min_width, half_width);
1109
1110 } else {
1111 // Split through the middle, use the split_width for faster searching.
1112 co_yield {std::move(split_lines), split_width};
1113 stack.emplace_back(entry.min_height, split_height, entry.min_width, split_width);
1114 stack.emplace_back(split_height, entry.max_height, split_width, entry.max_width);
1115 }
1116 }
1117 } while (not stack.empty());
1118 }
1119 }
1120
1129 [[nodiscard]] line_vector make_lines(
1130 aarectangle rectangle,
1131 float baseline,
1132 extent2 sub_pixel_size) noexcept
1133 {
1134 auto const line_sizes = unicode_line_break(_line_break_opportunities, _line_break_widths, rectangle.width());
1135
1136 auto r = text_shaper::line_vector{};
1137 r.reserve(line_sizes.size());
1138
1139 auto char_it = _text.begin();
1140 auto width_it = _line_break_widths.begin();
1141 auto line_nr = 0_uz;
1142 for (auto const line_size : line_sizes) {
1143 hi_axiom(line_size > 0);
1144 auto const char_eol = char_it + line_size;
1145 auto const width_eol = width_it + line_size;
1146
1147 auto const line_width = detail::unicode_LB_width(width_it, width_eol);
1148 r.emplace_back(line_nr++, _text.begin(), char_it, char_eol, line_width, _initial_line_metrics);
1149
1150 char_it = char_eol;
1151 width_it = width_eol;
1152 }
1153
1154 if (r.empty() or is_Zp_or_Zl(r.back().last_category)) {
1155 r.emplace_back(line_nr++, _text.begin(), _text.end(), _text.end(), 0.0f, _initial_line_metrics);
1156 r.back().paragraph_direction = _text_direction;
1157 }
1158
1159 layout_lines_vertical_spacing(r);
1160 layout_lines_vertical_alignment(
1161 r, _alignment.vertical(), baseline, rectangle.bottom(), rectangle.top(), sub_pixel_size.height());
1162
1163 return r;
1164 }
1165
1172 void position_glyphs(aarectangle rectangle, extent2 sub_pixel_size) noexcept
1173 {
1174 hi_assert(not _lines.empty());
1175
1176 // The bidi algorithm will reorder the characters on each line, and mirror the brackets in the text when needed.
1177 bidi_algorithm(_lines, _text, _bidi_context);
1178 for (auto& line : _lines) {
1179 // Position the glyphs on each line. Possibly morph glyphs to handle ligatures and calculate the bounding rectangles.
1180 line.layout(_alignment.horizontal(), rectangle.left(), rectangle.right(), sub_pixel_size.width());
1181 }
1182 }
1183
1186 void resolve_script() noexcept
1187 {
1188 // Find the first script in the text if no script is found use the text_shaper's default script.
1189 auto first_script = _script;
1190 for (auto& c : _text) {
1191 auto const script = ucd_get_script(c.grapheme.starter());
1192 if (script != iso_15924::wildcard() or script == iso_15924::uncoded() or script == iso_15924::common() or
1193 script == iso_15924::inherited()) {
1194 first_script = script;
1195 break;
1196 }
1197 }
1198
1199 // Backward pass: fix start of words and open-brackets.
1200 // After this pass unknown-script is no longer in the text.
1201 // Close brackets will not be fixed, those will be fixed in the last forward pass.
1202 auto word_script = iso_15924::common();
1203 auto previous_script = first_script;
1204 for (auto i = std::ssize(_text) - 1; i >= 0; --i) {
1205 auto& c = _text[i];
1206
1207 if (_word_break_opportunities[i + 1] != unicode_break_opportunity::no) {
1208 word_script = iso_15924::common();
1209 }
1210
1211 c.script = ucd_get_script(c.grapheme.starter());
1212 if (c.script == iso_15924::uncoded() or c.script == iso_15924::common()) {
1213 auto const bracket_type = ucd_get_bidi_paired_bracket_type(c.grapheme.starter());
1214 // clang-format off
1215 c.script =
1216 bracket_type == unicode_bidi_paired_bracket_type::o ? previous_script :
1217 bracket_type == unicode_bidi_paired_bracket_type::c ? iso_15924::common() :
1218 word_script;
1219 // clang-format on
1220
1221 } else if (c.script != iso_15924::inherited()) {
1222 previous_script = word_script = c.script;
1223 }
1224 }
1225
1226 // Forward pass: fix all common and inherited with previous or first script.
1227 previous_script = first_script;
1228 for (auto i = 0_uz; i != _text.size(); ++i) {
1229 auto& c = _text[i];
1230
1231 if (c.script == iso_15924::common() or c.script == iso_15924::inherited()) {
1232 c.script = previous_script;
1233
1234 } else {
1235 previous_script = c.script;
1236 }
1237 }
1238 }
1239
1240 [[nodiscard]] std::pair<text_cursor, text_cursor>
1241 get_selection_from_break(text_cursor cursor, unicode_break_vector const& break_opportunities) const noexcept
1242 {
1243 if (_text.empty()) {
1244 return {{}, {}};
1245 }
1246
1247 // In the algorithm below we search before and after the character that the cursor is at.
1248 // We do not use the before/after differentiation.
1249
1250 auto const first_index = [&]() {
1251 auto i = cursor.index();
1252 while (break_opportunities[i] == unicode_break_opportunity::no) {
1253 --i;
1254 }
1255 return i;
1256 }();
1257 auto const last_index = [&]() {
1258 auto i = cursor.index();
1259 while (break_opportunities[i + 1] == unicode_break_opportunity::no) {
1260 ++i;
1261 }
1262 return i;
1263 }();
1264
1265 return {get_before_cursor(first_index), get_after_cursor(last_index)};
1266 }
1267
1268 [[nodiscard]] std::pair<font_metrics_px, unicode_general_category>
1269 get_line_metrics(text_shaper::char_const_iterator first, text_shaper::char_const_iterator last) const noexcept
1270 {
1271 auto metrics = _initial_line_metrics;
1272 for (auto it = first; it != last; ++it) {
1273 // Only calculate line metrics based on visible characters.
1274 // For example a paragraph separator is seldom available in a font.
1275 if (is_visible(it->general_category)) {
1276 inplace_max(metrics, it->font_metrics());
1277 }
1278 }
1279
1280 auto const last_category = (first != last) ? (last - 1)->general_category : unicode_general_category::Cn;
1281 return {metrics, last_category};
1282 }
1283
1290 [[nodiscard]] float get_text_height(std::vector<size_t> const& lines) const noexcept
1291 {
1292 if (lines.empty()) {
1293 return 0.0f;
1294 }
1295
1296 auto line_it = lines.cbegin();
1297 auto char_it_first = _text.begin();
1298 auto char_it_last = char_it_first + *line_it++;
1299
1300 // Add the x-height of the first line.
1301 auto [previous_metrics, previous_category] = get_line_metrics(char_it_first, char_it_last);
1302 auto total_height = previous_metrics.x_height;
1303
1304 for (; line_it != lines.cend(); ++line_it) {
1305 char_it_first = std::exchange(char_it_last, char_it_last + *line_it);
1306
1307 // Advance to the base-line of the next line.
1308 auto [current_metrics, current_category] = get_line_metrics(char_it_first, char_it_last);
1309 auto const line_height = previous_metrics.descender + std::max(previous_metrics.line_gap, current_metrics.line_gap) +
1310 current_metrics.ascender;
1311
1312 auto const spacing = previous_category == unicode_general_category::Zp ? previous_metrics.paragraph_spacing :
1313 previous_metrics.line_spacing;
1314 total_height = total_height + spacing * line_height;
1315
1316 previous_metrics = std::move(current_metrics);
1317 previous_category = std::move(current_category);
1318 }
1319
1320 return total_height.in(unit::pixels);
1321 }
1322};
1323
1324} // namespace hi::inline v1
@ rectangle
The gui_event has rectangle data.
Definition gui_event_variant.hpp:44
@ alignment
An alignment was changed.
Definition style_modify_mask.hpp:43
@ pixel_density
The attributes that need to be modified when the pixel density changes.
Definition style_modify_mask.hpp:59
unicode_bidi_class
Bidirectional class Unicode Standard Annex #9: https://unicode.org/reports/tr9/.
Definition ucd_bidi_classes.hpp:861
DOXYGEN BUG.
Definition algorithm_misc.hpp:20
constexpr gstring to_gstring(std::u32string_view rhs, unicode_normalize_config config=unicode_normalize_config::NFC()) noexcept
Convert a UTF-32 string-view to a grapheme-string.
Definition gstring.hpp:263
unicode_break_vector unicode_line_break(It first, ItEnd last, CodePointFunc const &code_point_func) noexcept
The unicode line break algorithm UAX #14.
Definition unicode_line_break.hpp:633
unicode_break_vector unicode_sentence_break(It first, ItEnd last, CodePointFunc const &code_point_func) noexcept
The unicode sentence break algorithm UAX#29.
Definition unicode_sentence_break.hpp:258
constexpr extent2 sub_pixel_size(subpixel_orientation orientation) noexcept
Get the size of a sub-pixel based on the sub-pixel orientation.
Definition subpixel_orientation.hpp:41
constexpr std::pair< It, std::vector< unicode_bidi_class > > unicode_bidi(It first, It last, GetCodePoint get_code_point, SetCodePoint set_code_point, SetTextDirection set_text_direction, unicode_bidi_context const &context={})
Reorder a given range of characters based on the unicode_bidi algorithm.
Definition unicode_bidi.hpp:1219
constexpr unicode_bidi_class unicode_bidi_direction(It first, It last, GetCodePoint get_code_point, unicode_bidi_context const &context={})
Get the unicode bidi direction for the first paragraph and context.
Definition unicode_bidi.hpp:1259
unicode_break_vector unicode_word_break(It first, ItEnd last, CodePointFunc const &code_point_func) noexcept
The unicode word break algorithm UAX#29.
Definition unicode_word_break.hpp:240
Definition font_font.hpp:32
font_metrics_em metrics
The metrics of a font.
Definition font_font.hpp:66
Horizontal/Vertical alignment combination.
Definition alignment.hpp:244
A high-level geometric point. Part of the high-level vec, point, mat and color types.
Definition point2.hpp:28
A cursor-position in text.
Definition text_cursor.hpp:26
constexpr text_cursor & resize(size_t size) &noexcept
Set the text size.
Definition text_cursor.hpp:49
text_cursor get_before_cursor(text_shaper::char_const_iterator it) const noexcept
Get the cursor before the character in logical order.
Definition text_shaper.hpp:453
std::pair< text_cursor, text_cursor > select_paragraph(text_cursor cursor) const noexcept
Get the selection for a paragraph at the cursor.
Definition text_shaper.hpp:583
std::pair< size_t, size_t > get_column_line(size_t index) const noexcept
Get the column and line of a character.
Definition text_shaper.hpp:385
char_const_iterator get_it(text_cursor cursor) const noexcept
Get the character at the cursor.
Definition text_shaper.hpp:299
char_const_iterator get_it(size_t column_nr, size_t line_nr) const noexcept
Get the character at column and row in display order.
Definition text_shaper.hpp:312
std::pair< text_cursor, text_cursor > select_sentence(text_cursor cursor) const noexcept
Get the selection for the sentence at the cursor.
Definition text_shaper.hpp:576
bool is_on_left(text_cursor cursor) const noexcept
Check if the cursor is on the left side of the character in display order.
Definition text_shaper.hpp:509
bool is_on_right(text_cursor cursor) const noexcept
Check if the cursor is on the right side of the character in display order.
Definition text_shaper.hpp:525
text_cursor get_after_cursor(text_shaper::char_const_iterator it) const noexcept
Get the cursor after the character in logical order.
Definition text_shaper.hpp:463
unicode_bidi_class text_direction() const noexcept
Get the text-direction as a whole.
Definition text_shaper.hpp:259
text_shaper(gstring const &text, text_style_set const &style, unit::pixel_density pixel_density, hi::alignment alignment, bool left_to_right, iso_15924 script=iso_15924{"Zyyy"}) noexcept
Construct a text_shaper with a text and alignment.
Definition text_shaper.hpp:83
aarectangle rectangle() const noexcept
The rectangle used when laying out the text.
Definition text_shaper.hpp:252
std::pair< text_cursor, text_cursor > select_char(text_cursor cursor) const noexcept
Get the selection for the character at the cursor.
Definition text_shaper.hpp:561
std::pair< size_t, size_t > get_column_line(text_shaper::char_const_iterator it) const noexcept
Get the column and line of a character.
Definition text_shaper.hpp:370
text_cursor get_left_cursor(text_shaper::char_const_iterator it) const noexcept
Get the cursor left of the character in display order.
Definition text_shaper.hpp:473
std::pair< text_cursor, text_cursor > select_word(text_cursor cursor) const noexcept
Get the selection for the word at the cursor.
Definition text_shaper.hpp:569
size_t get_index(text_shaper::char_const_iterator it) const noexcept
Get the index of the character in logical order.
Definition text_shaper.hpp:405
char_const_iterator get_it(size_t index) const noexcept
Get the character at index in logical order.
Definition text_shaper.hpp:281
text_cursor get_end_cursor() const noexcept
Get the cursor at the end of the document.
Definition text_shaper.hpp:423
std::pair< text_cursor, text_cursor > select_document(text_cursor cursor) const noexcept
Get the selection for the whole document at the cursor.
Definition text_shaper.hpp:611
aarectangle bounding_rectangle(float maximum_line_width) noexcept
Get bounding rectangle.
Definition text_shaper.hpp:207
char_const_iterator move_right_char(char_const_iterator it) const noexcept
Get the character to the right.
Definition text_shaper.hpp:636
char_const_iterator get_it(std::pair< size_t, size_t > column_row) const noexcept
Get the character at column and row in display order.
Definition text_shaper.hpp:360
void layout(aarectangle rectangle, float baseline, extent2 sub_pixel_size) noexcept
Layout the lines of the text.
Definition text_shaper.hpp:239
text_cursor get_begin_cursor() const noexcept
Get the cursor at the beginning of the document.
Definition text_shaper.hpp:414
text_cursor get_after_cursor(size_t index) const noexcept
Get the cursor after the character in logical order.
Definition text_shaper.hpp:443
alignment resolved_alignment() const noexcept
Get the resolved alignment of the text.
Definition text_shaper.hpp:269
text_cursor get_nearest_cursor(point2 position) const noexcept
Find the nearest character.
Definition text_shaper.hpp:541
text_cursor get_before_cursor(size_t index) const noexcept
Get the cursor before the character in logical order.
Definition text_shaper.hpp:433
std::pair< size_t, size_t > get_column_line(text_cursor cursor) const noexcept
Get the column and line of a character.
Definition text_shaper.hpp:395
text_cursor get_right_cursor(text_shaper::char_const_iterator it) const noexcept
Get the cursor right of the character in display order.
Definition text_shaper.hpp:491
char_const_iterator move_left_char(char_const_iterator it) const noexcept
Get the character to the left.
Definition text_shaper.hpp:625
A grapheme-cluster, what a user thinks a character is.
Definition grapheme.hpp:168
T begin(T... args)
T ceil(T... args)
T distance(T... args)
T end(T... args)
T isnan(T... args)
T lowest(T... args)
T max(T... args)
T move(T... args)
T prev(T... args)
T round(T... args)
T size(T... args)