From 44d04124f33902f783dd5fc2901fcf4011b2ea42 Mon Sep 17 00:00:00 2001 From: Mercury13 Date: Tue, 17 Dec 2024 03:01:33 +0200 Subject: [PATCH] Improved search for non-European typography --- Lang-src/en.uorig | 9 ++++++--- Lang-src/ja.utran | 27 ++++++++++++++++++--------- Lang-src/ru.utran | 17 +++++++++++++---- Lang-src/uk.utran | 17 +++++++++++++---- Unicodia/FmMain.cpp | 12 ++++++------ 5 files changed, 56 insertions(+), 26 deletions(-) diff --git a/Lang-src/en.uorig b/Lang-src/en.uorig index 35ac661b4..5271b7688 100644 --- a/Lang-src/en.uorig +++ b/Lang-src/en.uorig @@ -8262,9 +8262,12 @@ Unassigned code Test: search for A0000 - - Vacant position - Test: search for everything vacant, e.g. 03A2 + + Vacant position: {1} + +

1 = block name

+

Test: search for 03A2

+
Not found diff --git a/Lang-src/ja.utran b/Lang-src/ja.utran index 2c998ec57..5b4533558 100644 --- a/Lang-src/ja.utran +++ b/Lang-src/ja.utran @@ -1429,9 +1429,9 @@ -

Letters of small Cyrillic languages: Abkhaz, Kurdish ''(as minority of USSR)'', Komi, Mordovian, Aleut, Azeri ''(now [[ps:Latn|Latin]])'' and Chuvash in Yakovlev alphabet ''(used 1873–1938)''.

+

Letters of small Cyrillic languages: Abkhaz, Kurdish ''(as minority of the USSR)'', Komi, Mordovian, Aleut, Azeri ''(now [[ps:Latn|Latin]])'' and Chuvash in Yakovlev alphabet ''(used 1873–1938)''.

-

Contains a funny letter {{sm|Ԥ}} (looks like a word of Russian mat meaning “epic fail”). It was “invented” by Leonid Kaganov; it turned out, not{{_}}the{{_}}first: three years before his post (2008) T-shirts with this letter were sold in Russia. And independently from him, Abkhazians instead of hook {{sm|Ҧ}} {{t|pʰ}} started to write descender, and that gave letter {{sm|Ԥ}} a place in Unicode.

+

Contains a funny letter {{sm|Ԥ}} (looks like the word of Russian mat meaning “epic fail”). It was “invented” by Leonid Kaganov; it turned out, not{{_}}the{{_}}first: three years before his post (2008) T-shirts with this letter were sold in Russia. And independently from him, Abkhazians instead of hook {{sm|Ҧ}} {{t|pʰ}} started to write descender, and that gave letter {{sm|Ԥ}} a place in Unicode.

@@ -2110,7 +2110,7 @@ - Coptic + Coptic @@ -6393,11 +6393,11 @@
-

Invented by Krishna Bahadur Jentich (1926–1991). Initially pure alphabet, because of interaction with Brahmic scripts it started to use inherent {{t|a}} and [[pt:virama|virama]]. Official ortography does not recognize these changes.

+

Invented by Krishna Bahadur Jentich (1926–1991). Initially pure alphabet, because of interaction with Brahmic scripts it started to use inherent {{t|a}}, [[pt:virama|virama]], a mark for final {{t|r}}, and even [[pt:ligature|ligatures]] for consonant conjuncts. The official orthography does not recognize these changes.

The script did not mark tones until recently, and tone marks are basic 0300, 0301 and 030D.

-

The main script is [[ps:Deva|Devanagari]], poorly conveys Sunuwar phonetics. Also there’s Tikamuli, unencoded Brahmic abugida promoted since 2005 by influential funds.

+

The main script is [[ps:Deva|Devanagari]], which poorly conveys Sunuwar phonetics. Also, there’s Tikamuli, an unencoded Brahmic abugida promoted by influential funds since 2005.

@@ -9439,23 +9439,28 @@ Non-character + Test: search for FFFF 非文字 Private-use character + Test: search for E000 私用文字 Code from surrogate pair + Test: search for D800 サロゲートペアからのコード Unassigned code + Test: search for A0000 未割り当てコード - - Vacant position - 空席 + + Vacant position: {1} + 1 = block name + 空席: {1} Not found @@ -9471,11 +9476,15 @@ No such character + Test: find something other than character (e.g. U+FFFF), 2-click そのような文字はありません {1} emoji - “Emoji” is unchangeable, but you may still use one/few/many + +

“Emoji” is unchangeable, but you may still use one/few/many

+

Test: version info → emoji search

+
{1} 絵文字
diff --git a/Lang-src/ru.utran b/Lang-src/ru.utran index 77e091060..2dc7f95ce 100644 --- a/Lang-src/ru.utran +++ b/Lang-src/ru.utran @@ -11952,23 +11952,28 @@ Non-character + Test: search for FFFF Выброшенная позиция Private-use character + Test: search for E000 Символ для личного пользования Code from surrogate pair + Test: search for D800 Код из суррогатной пары Unassigned code + Test: search for A0000 Нераспределённый код - - Vacant position - Свободное место + + Vacant position: {1} + 1 = block name + Свободное место: {1} Not found @@ -11984,11 +11989,15 @@ No such character + Test: find something other than character (e.g. U+FFFF), 2-click Такого символа нет {1} emoji - “Emoji” is unchangeable, but you may still use one/few/many + +

“Emoji” is unchangeable, but you may still use one/few/many

+

Test: version info → emoji search

+
{1} эмодзи
diff --git a/Lang-src/uk.utran b/Lang-src/uk.utran index e04b17587..c94655bd7 100644 --- a/Lang-src/uk.utran +++ b/Lang-src/uk.utran @@ -11955,23 +11955,28 @@ Non-character + Test: search for FFFF Викинута позиція Private-use character + Test: search for E000 Символ для приватного користування Code from surrogate pair + Test: search for D800 Код з сурогатної пари Unassigned code + Test: search for A0000 Нерозподілений код - - Vacant position - Вільне місце + + Vacant position: {1} + 1 = block name + Вільне місце: {1} Not found @@ -11987,11 +11992,15 @@ No such character + Test: find something other than character (e.g. U+FFFF), 2-click Такого символа немає {1} emoji - “Emoji” is unchangeable, but you may still use one/few/many + +

“Emoji” is unchangeable, but you may still use one/few/many

+

Test: version info → emoji search

+
{1} емодзі
diff --git a/Unicodia/FmMain.cpp b/Unicodia/FmMain.cpp index df56add78..1c66efa87 100644 --- a/Unicodia/FmMain.cpp +++ b/Unicodia/FmMain.cpp @@ -839,8 +839,9 @@ QVariant SearchModel::data(const QModelIndex& index, int role) const switch (role) { case Qt::DisplayRole: { QString s; + // LINE 1: What found if (line.code < uc::CAPACITY) { - // Character code + // …Character code uc::sprintUPLUS(buf, line.code); s += buf; if (line.prio.high == uc::HIPRIO_DEC) { @@ -850,7 +851,7 @@ QVariant SearchModel::data(const QModelIndex& index, int role) const s += "₁₀"; } } else if (line.node) { - // Library node + // …Library object std::u32string_view val = line.node->value; static constexpr auto SHORTLEN = 2; bool needShort = (val.length() > SHORTLEN && !line.triggerName.empty()); @@ -869,6 +870,7 @@ QVariant SearchModel::data(const QModelIndex& index, int role) const switch (primaryObj) { case uc::PrimaryObj::NUMERIC: if (auto sNum = toNumeric(line); !sNum.isEmpty()) { + // Code on the left → probably common for all LtR typography s += ": "; s += sNum; } @@ -883,14 +885,12 @@ QVariant SearchModel::data(const QModelIndex& index, int role) const break; } s += '\n'; + // LINE 2: Description switch (line.type) { case uc::CpType::EXISTING: return s + line.cp->viewableName(); case uc::CpType::RESERVED: - // Sloppy here, but the colon is probably replaced with something else - // globally in lockit - return s + loc::get("Search.Empty") + ": " - + str::toQ(uc::blockOf(line.code)->loc.name); + return s + loc::get("Search.Vacant").argQ(uc::blockOf(line.code)->loc.name); case uc::CpType::LIBNODE: if (!line.node) // -warn, should not happen for now return s;