public inbox for libc-alpha@sourceware.org
 help / color / mirror / Atom feed
* [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
@ 2021-04-21  5:38 Wei-Lun Chao
  2021-05-07 21:23 ` Carlos O'Donell
  0 siblings, 1 reply; 11+ messages in thread
From: Wei-Lun Chao @ 2021-04-21  5:38 UTC (permalink / raw)
  To: libc-alpha

From: Wei-Lun Chao <bluebat@member.fsf.org>

Rationale:
* Header cleanup: make the header of localedata files consistent
* Remove space (abmon): remove the extra prefix space in abmon 1~9
* Add (week): add the missing definition of week and first_weekday to 2
* Change (thousands_sep): change the thousands_sep from <U002C> to
<U2009> to avoid confusion of grouping 4 with usual grouping 3
* Simplify (yesexpr) and (noexpr): remove unusual full-width characters
* Add collation: add missing collation used in cmn_TW

Changelog:
* localedata/locales/cmn_TW: Header cleanup; Remove space (abmon); Add
(week); Change (thousands_sep); Simplify (yesexpr) and (noexpr).
* localedata/locales/hak_TW: Likewise and add collation.
* localedata/locales/nan_TW: Likewise and add collation.
* localedata/locales/lzh_TW: Likewise and add collation.

---
 localedata/locales/cmn_TW |  40 +++++++-------
 localedata/locales/hak_TW |  76 +++++++++++++-------------
 localedata/locales/lzh_TW | 110 ++++++++++++++++++++++++--------------
 localedata/locales/nan_TW |  90 ++++++++++++++++---------------
 4 files changed, 174 insertions(+), 142 deletions(-)

diff --git a/localedata/locales/cmn_TW b/localedata/locales/cmn_TW
index 9d9aca0f9e..bc90121012 100644
--- a/localedata/locales/cmn_TW
+++ b/localedata/locales/cmn_TW
@@ -8,15 +8,9 @@ escape_char /
 % exempt you from the conditions of the license if your use would
 % otherwise be governed by that license.

-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-%
 % Mandarin Chinese locale for the Republic of China
-%
 % Prepared and contributed to glibc by Wei-Lun Chao <bluebat@member.fsf.org>
-%
 % build with: localedef -f UTF-8 -i cmn_TW cmn_TW
-%
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

 LC_IDENTIFICATION
 title        "Mandarin Chinese locale for the Republic of China"
@@ -28,8 +22,8 @@ tel          ""
 fax          ""
 language     "Mandarin Chinese"
 territory    "Taiwan"
-revision     "0.2"
-date         "2017-07-20"
+revision     "0.3"
+date         "2021-04-21"

 category "i18n:2012";LC_IDENTIFICATION
 category "i18n:2012";LC_CTYPE
@@ -77,16 +71,16 @@ mon           "<U4E00><U6708>";/
      "<U5341><U6708>";/
      "<U5341><U4E00><U6708>";/
      "<U5341><U4E8C><U6708>"
-%  1月,  2月,  3月,  4月,  5月,  6月,  7月,  8月,  9月, 10月, 11月, 12月
-abmon         " 1<U6708>";/
-       " 2<U6708>";/
-       " 3<U6708>";/
-       " 4<U6708>";/
-       " 5<U6708>";/
-       " 6<U6708>";/
-       " 7<U6708>";/
-       " 8<U6708>";/
-       " 9<U6708>";/
+% 1月, 2月, 3月, 4月, 5月, 6月, 7月, 8月, 9月, 10月, 11月, 12月
+abmon         "1<U6708>";/
+       "2<U6708>";/
+       "3<U6708>";/
+       "4<U6708>";/
+       "5<U6708>";/
+       "6<U6708>";/
+       "7<U6708>";/
+       "8<U6708>";/
+       "9<U6708>";/
        "10<U6708>";/
        "11<U6708>";/
        "12<U6708>"
@@ -119,6 +113,8 @@ am_pm         "<U4E0A><U5348>";/
 t_fmt_ampm    "%p %I<U9EDE>%M<U5206>%S<U79D2>"
 % %Y年 %b %-d號 %A %H:%M:%S %Z
 date_fmt      "%Y<U5E74> %b %-d<U865F> %A %H:%M:%S %Z"
+week 7;19971130;1
+first_weekday 2

 era "+:2:1913//01//01:+*:<U6C11><U570B>:%EC%Ey<U5E74>";/
     "+:1:1912//01//01:1912//12//31:<U6C11><U570B>:%EC<U5143><U5E74>";/
@@ -127,7 +123,7 @@ END LC_TIME

 LC_NUMERIC
 decimal_point "."
-thousands_sep ","
+thousands_sep "<U2009>"
 grouping      4
 END LC_NUMERIC

@@ -135,7 +131,7 @@ LC_MONETARY
 currency_symbol    "NT$"
 int_curr_symbol    "TWD "
 mon_decimal_point  "."
-mon_thousands_sep  ","
+mon_thousands_sep  "<U2009>"
 mon_grouping       4
 positive_sign      ""
 negative_sign      "-"
@@ -166,8 +162,8 @@ measurement 1
 END LC_MEASUREMENT

 LC_MESSAGES
-yesexpr "^[+1yY<UFF59><UFF39><U662F>]"
-noexpr  "^[-0nN<UFF4E><UFF2E><U4E0D><U5426>]"
+yesexpr "^[yY]"
+noexpr  "^[nN]"
 % 是
 yesstr  "<U662F>"
 % 不是
diff --git a/localedata/locales/hak_TW b/localedata/locales/hak_TW
index 73b9678ec4..9824be119e 100644
--- a/localedata/locales/hak_TW
+++ b/localedata/locales/hak_TW
@@ -8,15 +8,9 @@ escape_char /
 % exempt you from the conditions of the license if your use would
 % otherwise be governed by that license.

-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-%
 % Hakka Chinese locale for the Republic of China
-%
 % Prepared and contributed to glibc by Wei-Lun Chao <bluebat@member.fsf.org>
-%
 % build with: localedef -f UTF-8 -i hak_TW hak_TW
-%
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

 LC_IDENTIFICATION
 title        "Hakka Chinese locale for the Republic of China"
@@ -28,8 +22,8 @@ tel          ""
 fax          ""
 language     "Hakka Chinese"
 territory    "Taiwan"
-revision     "0.1"
-date         "2013-06-02"
+revision     "0.2"
+date         "2021-04-21"

 category "i18n:2012";LC_IDENTIFICATION
 category "i18n:2012";LC_CTYPE
@@ -47,17 +41,20 @@ END LC_IDENTIFICATION

 LC_CTYPE
 copy "i18n"
+translit_start
+include "translit_combining";""
+translit_end
+
 class    "hanzi"; /
 <U3007>;/
 <U3400>..<U4DBF>;/
 <U4E00>..<U9FA5>;/
 <UF900>..<UFA6A>;/
-<U00020000>..<U0002A6D6>;/
-<U0002F800>..<U0002FA1D>
+<U00020000>..<U0002FA1D>
 END LC_CTYPE

 LC_COLLATE
-copy "iso14651_t1"
+copy "cns11643_stroke"
 END LC_COLLATE

 LC_TIME
@@ -74,16 +71,16 @@ mon           "<U4E00><U6708>";/
      "<U5341><U6708>";/
      "<U5341><U4E00><U6708>";/
      "<U5341><U4E8C><U6708>"
-%  1月,  2月,  3月,  4月,  5月,  6月,  7月,  8月,  9月, 10月, 11月, 12月
-abmon         " 1<U6708>";/
-       " 2<U6708>";/
-       " 3<U6708>";/
-       " 4<U6708>";/
-       " 5<U6708>";/
-       " 6<U6708>";/
-       " 7<U6708>";/
-       " 8<U6708>";/
-       " 9<U6708>";/
+% 1月, 2月, 3月, 4月, 5月, 6月, 7月, 8月, 9月, 10月, 11月, 12月
+abmon         "1<U6708>";/
+       "2<U6708>";/
+       "3<U6708>";/
+       "4<U6708>";/
+       "5<U6708>";/
+       "6<U6708>";/
+       "7<U6708>";/
+       "8<U6708>";/
+       "9<U6708>";/
        "10<U6708>";/
        "11<U6708>";/
        "12<U6708>"
@@ -103,19 +100,20 @@ abday         "<U65E5>";/
        "<U56DB>";/
        "<U4E94>";/
        "<U516D>"
-% %Y年%m月%d日 (%A) %H點%M分%S秒
-d_t_fmt       "%Y<U5E74>%m<U6708>%d<U65E5> (%A) %H<U9EDE>%M<U5206>%S<U79D2>"
-% %Y年%m月%d日
-d_fmt         "%Y<U5E74>%m<U6708>%d<U65E5>"
+% %Y年%m月%d號 (%A) %H點%M分%S秒
+d_t_fmt       "%Y<U5E74>%m<U6708>%d<U865F> (%A) %H<U9EDE>%M<U5206>%S<U79D2>"
+% %Y年%m月%d號
+d_fmt         "%Y<U5E74>%m<U6708>%d<U865F>"
 % %H點%M分%S秒
 t_fmt         "%H<U9EDE>%M<U5206>%S<U79D2>"
 % 上晝, 下晝
 am_pm         "<U4E0A><U665D>";"<U4E0B><U665D>"
 % %p %I點%M分%S秒
 t_fmt_ampm    "%p %I<U9EDE>%M<U5206>%S<U79D2>"
-% %Y年 %b %e日 %A %H:%M:%S %Z
-date_fmt      "%Y<U5E74> %b %e<U65E5> %A %H:%M:%S %Z"
+% %Y年 %b %-d號 %A %H:%M:%S %Z
+date_fmt      "%Y<U5E74> %b %-d<U865F> %A %H:%M:%S %Z"
 week 7;19971130;1
+first_weekday 2

 era "+:2:1913//01//01:+*:<U6C11><U570B>:%EC%Ey<U5E74>";/
     "+:1:1912//01//01:1912//12//31:<U6C11><U570B>:%EC<U5143><U5E74>";/
@@ -124,7 +122,7 @@ END LC_TIME

 LC_NUMERIC
 decimal_point "."
-thousands_sep ","
+thousands_sep "<U2009>"
 grouping      4
 END LC_NUMERIC

@@ -132,7 +130,7 @@ LC_MONETARY
 currency_symbol    "NT$"
 int_curr_symbol    "TWD "
 mon_decimal_point  "."
-mon_thousands_sep  ","
+mon_thousands_sep  "<U2009>"
 mon_grouping       4
 positive_sign      ""
 negative_sign      "-"
@@ -153,18 +151,22 @@ int_n_sign_posn    1
 END LC_MONETARY

 LC_PAPER
-copy "i18n"
+height 297
+width  210
 END LC_PAPER

 LC_MEASUREMENT
-copy "i18n"
+% metric
+measurement 1
 END LC_MEASUREMENT

 LC_MESSAGES
-% ^[+1yYyY係]
-yesexpr "^[+1yY<UFF59><UFF39><U4FC2>]"
-% ^[-0nNnN毋]
-noexpr  "^[-0nN<UFF4E><UFF2E><U6BCB>]"
+yesexpr "^[yY]"
+noexpr  "^[nN]"
+% 係
+yesstr  "<U4FC2>"
+% 毋係
+nostr   "<U6BCB><U4FC2>"
 END LC_MESSAGES

 LC_NAME
@@ -191,8 +193,8 @@ country_ab3  "TWN"
 country_num  158
 country_car "RC"
 country_isbn 957
-% 客家語
-lang_name    "<U5BA2><U5BB6><U8A71>"
+% 漢語客家語
+lang_name    "<U6F22><U8A9E><U5BA2><U5BB6><U8A9E>"
 lang_term    "hak"
 lang_lib     "hak"
 END LC_ADDRESS
diff --git a/localedata/locales/lzh_TW b/localedata/locales/lzh_TW
index 4740418a83..ba4c495b09 100644
--- a/localedata/locales/lzh_TW
+++ b/localedata/locales/lzh_TW
@@ -8,15 +8,9 @@ escape_char /
 % exempt you from the conditions of the license if your use would
 % otherwise be governed by that license.

-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-%
 % Literary Chinese locale for the Republic of China
-%
 % Prepared and contributed to glibc by Wei-Lun Chao <bluebat@member.fsf.org>
-%
 % build with: localedef -f UTF-8 -i lzh_TW lzh_TW
-%
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

 LC_IDENTIFICATION
 title        "Literary Chinese locale for the Republic of China"
@@ -28,8 +22,8 @@ tel          ""
 fax          ""
 language     "Literary Chinese"
 territory    "Taiwan"
-revision     "0.1"
-date         "2013-06-02"
+revision     "0.2"
+date         "2021-04-21"

 category "i18n:2012";LC_IDENTIFICATION
 category "i18n:2012";LC_CTYPE
@@ -47,17 +41,20 @@ END LC_IDENTIFICATION

 LC_CTYPE
 copy "i18n"
+translit_start
+include "translit_combining";""
+translit_end
+
 class    "hanzi"; /
 <U3007>;/
 <U3400>..<U4DBF>;/
 <U4E00>..<U9FA5>;/
 <UF900>..<UFA6A>;/
-<U00020000>..<U0002A6D6>;/
-<U0002F800>..<U0002FA1D>
+<U00020000>..<U0002FA1D>
 END LC_CTYPE

 LC_COLLATE
-copy "iso14651_t1"
+copy "cns11643_stroke"
 END LC_COLLATE

 LC_TIME
@@ -74,17 +71,17 @@ mon           "<U4E00><U6708>";/
      "<U5341><U6708>";/
      "<U5341><U4E00><U6708>";/
      "<U5341><U4E8C><U6708>"
-%  一 ,  二 ,  三 ,  四 ,  五 ,  六 ,  七 ,  八 ,  九 ,  十 , 十一, 十二
-abmon         " <U4E00> ";/
-       " <U4E8C> ";/
-       " <U4E09> ";/
-       " <U56DB> ";/
-       " <U4E94> ";/
-       " <U516D> ";/
-       " <U4E03> ";/
-       " <U516B> ";/
-       " <U4E5D> ";/
-       " <U5341> ";/
+% 一, 二, 三, 四, 五, 六, 七, 八, 九, 十, 十一, 十二
+abmon         "<U4E00>";/
+       "<U4E8C>";/
+       "<U4E09>";/
+       "<U56DB>";/
+       "<U4E94>";/
+       "<U516D>";/
+       "<U4E03>";/
+       "<U516B>";/
+       "<U4E5D>";/
+       "<U5341>";/
        "<U5341><U4E00>";/
        "<U5341><U4E8C>"
 % 週日, 週一, 週二, 週三, 週四, 週五, 週六
@@ -103,19 +100,21 @@ abday         "<U65E5>";/
        "<U56DB>";/
        "<U4E94>";/
        "<U516D>"
-% %OC%Oy年%B%Od日 (%A) %OH時%OM分%OS秒
-d_t_fmt       "%OC%Oy<U5E74>%B%Od<U65E5> (%A) %OH<U6642>%OM<U5206>%OS<U79D2>"
-% %OC%Oy年%B%Od日
-d_fmt         "%OC%Oy<U5E74>%B%Od<U65E5>"
+% %Y年%B%Od (%A) %OH時%OM分%OS秒
+d_t_fmt       "%Y<U5E74>%B%Od (%A) %OH<U6642>%OM<U5206>%OS<U79D2>"
+% %Y年%B%Od
+d_fmt         "%Y<U5E74>%B%Od"
 % %OH時%OM分%OS秒
 t_fmt         "%OH<U6642>%OM<U5206>%OS<U79D2>"
 % 朝, 暮
-am_pm         "<U671D>";"<U66AE>"
+am_pm         "<U671D>";/
+       "<U66AE>"
 % %p %OI時%OM分%OS秒
 t_fmt_ampm    "%p %OI<U6642>%OM<U5206>%OS<U79D2>"
-% 公曆 %C%Oy年 %B %Oe日 %A %OH時%OM分%OS秒
-date_fmt      "<U516C><U66C6> %C%Oy<U5E74> %B %Oe<U65E5> %A
%OH<U6642>%OM<U5206>%OS<U79D2>"
-% 〇, 一, 二, 三, 四, 五, 六, 七, 八, 九, 十, 十一, 十二, 十三, 十四, 十五, 十六, 十七, 十八,
十九, 廿, 廿一, 廿二, 廿三, 廿四, 廿五, 廿六, 廿七, 廿八, 廿九, 卅, 卅一
+% 公曆 %Y年 %B %Oe %A %OH時%OM分%OS秒
+date_fmt      "<U516C><U66C6> %Y<U5E74> %B %Oe %A
%OH<U6642>%OM<U5206>%OS<U79D2>"
+% 〇, 一, 二, 三, 四, 五, 六, 七, 八, 九, 十, 十一, 十二, 十三, 十四, 十五, 十六, 十七, 十八,
十九, 廿, 廿一, 廿二, 廿三, 廿四, 廿五, 廿六, 廿七, 廿八, 廿九, 卅, 卅一,
+% 卅二, 卅三, 卅四, 卅五, 卅六, 卅七, 卅八, 卅九, 四十, 四十一, 四十二, 四十三, 四十四, 四十五, 四十六,
四十七, 四十八, 四十九, 五十, 五十一, 五十二, 五十三, 五十四, 五十五, 五十六, 五十七, 五十八, 五十九
 alt_digits    "<U3007>";/
             "<U4E00>";/
             "<U4E8C>";/
@@ -147,9 +146,38 @@ alt_digits    "<U3007>";/
             "<U5EFF><U516B>";/
             "<U5EFF><U4E5D>";/
             "<U5345>";/
-            "<U5345><U4E00>"
+            "<U5345><U4E00>";/
+            "<U5345><U4E8C>";/
+            "<U5345><U4E09>";/
+            "<U5345><U56DB>";/
+            "<U5345><U4E94>";/
+            "<U5345><U516D>";/
+            "<U5345><U4E03>";/
+            "<U5345><U516B>";/
+            "<U5345><U4E5D>";/
+            "<U56DB><U5341>";/
+            "<U56DB><U5341><U4E00>";/
+            "<U56DB><U5341><U4E8C>";/
+            "<U56DB><U5341><U4E09>";/
+            "<U56DB><U5341><U56DB>";/
+            "<U56DB><U5341><U4E94>";/
+            "<U56DB><U5341><U516D>";/
+            "<U56DB><U5341><U4E03>";/
+            "<U56DB><U5341><U516B>";/
+            "<U56DB><U5341><U4E5D>";/
+            "<U56DB><U5341>";/
+            "<U4E94><U5341><U4E00>";/
+            "<U4E94><U5341><U4E8C>";/
+            "<U4E94><U5341><U4E09>";/
+            "<U4E94><U5341><U56DB>";/
+            "<U4E94><U5341><U4E94>";/
+            "<U4E94><U5341><U516D>";/
+            "<U4E94><U5341><U4E03>";/
+            "<U4E94><U5341><U516B>";/
+            "<U4E94><U5341><U4E5D>"
 %
 week 7;19971130;1
+first_weekday 2

 era "+:2:1913//01//01:+*:<U6C11><U570B>:%EC%Ey<U5E74>";/
     "+:1:1912//01//01:1912//12//31:<U6C11><U570B>:%EC<U5143><U5E74>";/
@@ -158,7 +186,7 @@ END LC_TIME

 LC_NUMERIC
 decimal_point "."
-thousands_sep ","
+thousands_sep "<U2009>"
 grouping      4
 END LC_NUMERIC

@@ -166,7 +194,7 @@ LC_MONETARY
 currency_symbol    "NT$"
 int_curr_symbol    "TWD "
 mon_decimal_point  "."
-mon_thousands_sep  ","
+mon_thousands_sep  "<U2009>"
 mon_grouping       4
 positive_sign      ""
 negative_sign      "-"
@@ -187,18 +215,22 @@ int_n_sign_posn    1
 END LC_MONETARY

 LC_PAPER
-copy "i18n"
+height 297
+width  210
 END LC_PAPER

 LC_MEASUREMENT
-copy "i18n"
+% metric
+measurement 1
 END LC_MEASUREMENT

 LC_MESSAGES
-% ^[+1yYyY是]
-yesexpr "^[+1yY<UFF59><UFF39><U662F>]"
-% ^[-0nNnN非]
-noexpr  "^[-0nN<UFF4E><UFF2E><U975E>]"
+yesexpr "^[yY]"
+noexpr  "^[nN]"
+% 是
+yesstr  "<U662F>"
+% 否
+nostr   "<U5426>"
 END LC_MESSAGES

 LC_NAME
diff --git a/localedata/locales/nan_TW b/localedata/locales/nan_TW
index 0c2a56f4ca..83e47afbae 100644
--- a/localedata/locales/nan_TW
+++ b/localedata/locales/nan_TW
@@ -1,22 +1,16 @@
 comment_char %
 escape_char /

-% This file is part of the GNU C Library and contains locale data.
-% The Free Software Foundation does not claim any copyright interest
-% in the locale data contained in this file.  The foregoing does not
-% affect the license of the GNU C Library as a whole.  It does not
-% exempt you from the conditions of the license if your use would
-% otherwise be governed by that license.
-
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-%
+% This file is a part of GNU C Library (glibc) and contains locale data. The
+% Free Software Foundation does not claim any copyright interest in the
+% locale data contained in this file. The foregoing does not affect the
+% license of GNU C Library (glibc) as a whole. It does not exempt you from the
+% conditions of the license if your use would otherwise be governed by
+% that license.
+
 % Min Nan Chinese locale for the Republic of China
-%
 % Prepared and contributed to glibc by Wei-Lun Chao <bluebat@member.fsf.org>
-%
 % build with: localedef -f UTF-8 -i nan_TW nan_TW
-%
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

 LC_IDENTIFICATION
 title        "Min Nan Chinese locale for the Republic of China"
@@ -28,8 +22,8 @@ tel          ""
 fax          ""
 language     "Min Nan Chinese"
 territory    "Taiwan"
-revision     "0.1"
-date         "2013-06-02"
+revision     "0.2"
+date         "2021-04-21"

 category "i18n:2012";LC_IDENTIFICATION
 category "i18n:2012";LC_CTYPE
@@ -47,17 +41,20 @@ END LC_IDENTIFICATION

 LC_CTYPE
 copy "i18n"
+translit_start
+include "translit_combining";""
+translit_end
+
 class    "hanzi"; /
 <U3007>;/
 <U3400>..<U4DBF>;/
 <U4E00>..<U9FA5>;/
 <UF900>..<UFA6A>;/
-<U00020000>..<U0002A6D6>;/
-<U0002F800>..<U0002FA1D>
+<U00020000>..<U0002FA1D>
 END LC_CTYPE

 LC_COLLATE
-copy "iso14651_t1"
+copy "cns11643_stroke"
 END LC_COLLATE

 LC_TIME
@@ -74,16 +71,16 @@ mon           "<U4E00><U6708>";/
      "<U5341><U6708>";/
      "<U5341><U4E00><U6708>";/
      "<U5341><U4E8C><U6708>"
-%  1月,  2月,  3月,  4月,  5月,  6月,  7月,  8月,  9月, 10月, 11月, 12月
-abmon         " 1<U6708>";/
-       " 2<U6708>";/
-       " 3<U6708>";/
-       " 4<U6708>";/
-       " 5<U6708>";/
-       " 6<U6708>";/
-       " 7<U6708>";/
-       " 8<U6708>";/
-       " 9<U6708>";/
+% 1月, 2月, 3月, 4月, 5月, 6月, 7月, 8月, 9月, 10月, 11月, 12月
+abmon         "1<U6708>";/
+       "2<U6708>";/
+       "3<U6708>";/
+       "4<U6708>";/
+       "5<U6708>";/
+       "6<U6708>";/
+       "7<U6708>";/
+       "8<U6708>";/
+       "9<U6708>";/
        "10<U6708>";/
        "11<U6708>";/
        "12<U6708>"
@@ -103,10 +100,10 @@ abday         "<U65E5>";/
        "<U56DB>";/
        "<U4E94>";/
        "<U516D>"
-% %Y年%m月%d日 (%A) %H點%M分%S秒
-d_t_fmt       "%Y<U5E74>%m<U6708>%d<U65E5> (%A) %H<U9EDE>%M<U5206>%S<U79D2>"
-% %Y年%m月%d日
-d_fmt         "%Y<U5E74>%m<U6708>%d<U65E5>"
+% %Y年%m月%d號 (%A) %H點%M分%S秒
+d_t_fmt       "%Y<U5E74>%m<U6708>%d<U865F> (%A) %H<U9EDE>%M<U5206>%S<U79D2>"
+% %Y年%m月%d號
+d_fmt         "%Y<U5E74>%m<U6708>%d<U865F>"
 % %H點%M分%S秒
 t_fmt         "%H<U9EDE>%M<U5206>%S<U79D2>"
 % 頂晡, 下晡
@@ -114,9 +111,10 @@ am_pm         "<U9802><U6661>";/
        "<U4E0B><U6661>"
 % %p %I點%M分%S秒
 t_fmt_ampm    "%p %I<U9EDE>%M<U5206>%S<U79D2>"
-% %Y年 %b %e日 %A %H:%M:%S %Z
-date_fmt      "%Y<U5E74> %b %e<U65E5> %A %H:%M:%S %Z"
+% %Y年 %b %-d號 %A %H:%M:%S %Z
+date_fmt      "%Y<U5E74> %b %-d<U865F> %A %H:%M:%S %Z"
 week 7;19971130;1
+first_weekday 2

 era "+:2:1913//01//01:+*:<U6C11><U570B>:%EC%Ey<U5E74>";/
     "+:1:1912//01//01:1912//12//31:<U6C11><U570B>:%EC<U5143><U5E74>";/
@@ -125,7 +123,7 @@ END LC_TIME

 LC_NUMERIC
 decimal_point "."
-thousands_sep ","
+thousands_sep "<U2009>"
 grouping      4
 END LC_NUMERIC

@@ -133,7 +131,7 @@ LC_MONETARY
 currency_symbol    "NT$"
 int_curr_symbol    "TWD "
 mon_decimal_point  "."
-mon_thousands_sep  ","
+mon_thousands_sep  "<U2009>"
 mon_grouping       4
 positive_sign      ""
 negative_sign      "-"
@@ -154,18 +152,22 @@ int_n_sign_posn    1
 END LC_MONETARY

 LC_PAPER
-copy "i18n"
+height 297
+width  210
 END LC_PAPER

 LC_MEASUREMENT
-copy "i18n"
+% metric
+measurement 1
 END LC_MEASUREMENT

 LC_MESSAGES
-% ^[+1yYyY是]
-yesexpr "^[+1yY<UFF59><UFF39><U662F>]"
-% ^[-0nNnN伓]
-noexpr  "^[-0nN<UFF4E><UFF2E><U4F13>]"
+yesexpr "^[yY]"
+noexpr  "^[nN]"
+% 是
+yesstr  "<U662F>"
+% 毋是
+nostr   "<U6BCB><U662F>"
 END LC_MESSAGES

 LC_NAME
@@ -192,8 +194,8 @@ country_ab3  "TWN"
 country_num  158
 country_car "RC"
 country_isbn 957
-% 閩南語
-lang_name    "<U95A9><U5357><U8A9E>"
+% 漢語閩南語
+lang_name    "<U6F22><U8A9E><U95A9><U5357><U8A9E>"
 lang_term    "nan"
 lang_lib     "nan"
 END LC_ADDRESS
-- 
2.31.1

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
  2021-04-21  5:38 [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409] Wei-Lun Chao
@ 2021-05-07 21:23 ` Carlos O'Donell
  2021-05-10  3:07   ` Wei-Lun Chao
  0 siblings, 1 reply; 11+ messages in thread
From: Carlos O'Donell @ 2021-05-07 21:23 UTC (permalink / raw)
  To: Wei-Lun Chao, libc-alpha

On 4/21/21 1:38 AM, Wei-Lun Chao via Libc-alpha wrote:
> From: Wei-Lun Chao <bluebat@member.fsf.org>
> 
> Rationale:
> * Header cleanup: make the header of localedata files consistent
> * Remove space (abmon): remove the extra prefix space in abmon 1~9
> * Add (week): add the missing definition of week and first_weekday to 2
> * Change (thousands_sep): change the thousands_sep from <U002C> to
> <U2009> to avoid confusion of grouping 4 with usual grouping 3
> * Simplify (yesexpr) and (noexpr): remove unusual full-width characters
> * Add collation: add missing collation used in cmn_TW
> 
> Changelog:
> * localedata/locales/cmn_TW: Header cleanup; Remove space (abmon); Add
> (week); Change (thousands_sep); Simplify (yesexpr) and (noexpr).
> * localedata/locales/hak_TW: Likewise and add collation.
> * localedata/locales/nan_TW: Likewise and add collation.
> * localedata/locales/lzh_TW: Likewise and add collation.

CI/CD fails to apply the patch:
https://patchwork.sourceware.org/project/glibc/patch/CAP1CgNK6jk52eF1phakqmVkU1DJx0puk--NKAO2iFWjYXO=q7Q@mail.gmail.com/

Looks like your MUA is wrapping lines. Please fix. Thank you!

-- 
Cheers,
Carlos.


^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
  2021-05-07 21:23 ` Carlos O'Donell
@ 2021-05-10  3:07   ` Wei-Lun Chao
  2021-05-11 11:15     ` TAMUKI Shoichi
  2021-05-11 12:41     ` TAMUKI Shoichi
  0 siblings, 2 replies; 11+ messages in thread
From: Wei-Lun Chao @ 2021-05-10  3:07 UTC (permalink / raw)
  To: Carlos O'Donell; +Cc: libc-alpha

From: Wei-Lun Chao <bluebat@member.fsf.org>

Rationale:
* Header cleanup: make the header of localedata files consistent
* Remove space (abmon): remove the extra prefix space in abmon 1~9
* Add (week): add the missing definition of week and first_weekday to 2
* Change (thousands_sep): change the thousands_sep from <U002C> to
<U2009> to avoid confusion of grouping 4 with usual grouping 3
* Simplify (yesexpr) and (noexpr): remove unusual full-width characters
* Add collation: add missing collation used in cmn_TW

Changelog:
* localedata/locales/cmn_TW: Header cleanup; Remove space (abmon); Add
(week); Change (thousands_sep); Simplify (yesexpr) and (noexpr).
* localedata/locales/hak_TW: Likewise and add collation.
* localedata/locales/nan_TW: Likewise and add collation.
* localedata/locales/lzh_TW: Likewise and add collation.

---
 localedata/locales/cmn_TW |  40 +++++++-------
 localedata/locales/hak_TW |  76 +++++++++++++-------------
 localedata/locales/lzh_TW | 110 ++++++++++++++++++++++++--------------
 localedata/locales/nan_TW |  90 ++++++++++++++++---------------
 4 files changed, 174 insertions(+), 142 deletions(-)

diff --git a/localedata/locales/cmn_TW b/localedata/locales/cmn_TW
index 9d9aca0f9e..bc90121012 100644
--- a/localedata/locales/cmn_TW
+++ b/localedata/locales/cmn_TW
@@ -8,15 +8,9 @@ escape_char /
 % exempt you from the conditions of the license if your use would
 % otherwise be governed by that license.

-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-%
 % Mandarin Chinese locale for the Republic of China
-%
 % Prepared and contributed to glibc by Wei-Lun Chao <bluebat@member.fsf.org>
-%
 % build with: localedef -f UTF-8 -i cmn_TW cmn_TW
-%
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

 LC_IDENTIFICATION
 title        "Mandarin Chinese locale for the Republic of China"
@@ -28,8 +22,8 @@ tel          ""
 fax          ""
 language     "Mandarin Chinese"
 territory    "Taiwan"
-revision     "0.2"
-date         "2017-07-20"
+revision     "0.3"
+date         "2021-04-21"

 category "i18n:2012";LC_IDENTIFICATION
 category "i18n:2012";LC_CTYPE
@@ -77,16 +71,16 @@ mon           "<U4E00><U6708>";/
      "<U5341><U6708>";/
      "<U5341><U4E00><U6708>";/
      "<U5341><U4E8C><U6708>"
-%  1月,  2月,  3月,  4月,  5月,  6月,  7月,  8月,  9月, 10月, 11月, 12月
-abmon         " 1<U6708>";/
-       " 2<U6708>";/
-       " 3<U6708>";/
-       " 4<U6708>";/
-       " 5<U6708>";/
-       " 6<U6708>";/
-       " 7<U6708>";/
-       " 8<U6708>";/
-       " 9<U6708>";/
+% 1月, 2月, 3月, 4月, 5月, 6月, 7月, 8月, 9月, 10月, 11月, 12月
+abmon         "1<U6708>";/
+       "2<U6708>";/
+       "3<U6708>";/
+       "4<U6708>";/
+       "5<U6708>";/
+       "6<U6708>";/
+       "7<U6708>";/
+       "8<U6708>";/
+       "9<U6708>";/
        "10<U6708>";/
        "11<U6708>";/
        "12<U6708>"
@@ -119,6 +113,8 @@ am_pm         "<U4E0A><U5348>";/
 t_fmt_ampm    "%p %I<U9EDE>%M<U5206>%S<U79D2>"
 % %Y年 %b %-d號 %A %H:%M:%S %Z
 date_fmt      "%Y<U5E74> %b %-d<U865F> %A %H:%M:%S %Z"
+week 7;19971130;1
+first_weekday 2

 era "+:2:1913//01//01:+*:<U6C11><U570B>:%EC%Ey<U5E74>";/
     "+:1:1912//01//01:1912//12//31:<U6C11><U570B>:%EC<U5143><U5E74>";/
@@ -127,7 +123,7 @@ END LC_TIME

 LC_NUMERIC
 decimal_point "."
-thousands_sep ","
+thousands_sep "<U2009>"
 grouping      4
 END LC_NUMERIC

@@ -135,7 +131,7 @@ LC_MONETARY
 currency_symbol    "NT$"
 int_curr_symbol    "TWD "
 mon_decimal_point  "."
-mon_thousands_sep  ","
+mon_thousands_sep  "<U2009>"
 mon_grouping       4
 positive_sign      ""
 negative_sign      "-"
@@ -166,8 +162,8 @@ measurement 1
 END LC_MEASUREMENT

 LC_MESSAGES
-yesexpr "^[+1yY<UFF59><UFF39><U662F>]"
-noexpr  "^[-0nN<UFF4E><UFF2E><U4E0D><U5426>]"
+yesexpr "^[yY]"
+noexpr  "^[nN]"
 % 是
 yesstr  "<U662F>"
 % 不是
diff --git a/localedata/locales/hak_TW b/localedata/locales/hak_TW
index 73b9678ec4..9824be119e 100644
--- a/localedata/locales/hak_TW
+++ b/localedata/locales/hak_TW
@@ -8,15 +8,9 @@ escape_char /
 % exempt you from the conditions of the license if your use would
 % otherwise be governed by that license.

-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-%
 % Hakka Chinese locale for the Republic of China
-%
 % Prepared and contributed to glibc by Wei-Lun Chao <bluebat@member.fsf.org>
-%
 % build with: localedef -f UTF-8 -i hak_TW hak_TW
-%
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

 LC_IDENTIFICATION
 title        "Hakka Chinese locale for the Republic of China"
@@ -28,8 +22,8 @@ tel          ""
 fax          ""
 language     "Hakka Chinese"
 territory    "Taiwan"
-revision     "0.1"
-date         "2013-06-02"
+revision     "0.2"
+date         "2021-04-21"

 category "i18n:2012";LC_IDENTIFICATION
 category "i18n:2012";LC_CTYPE
@@ -47,17 +41,20 @@ END LC_IDENTIFICATION

 LC_CTYPE
 copy "i18n"
+translit_start
+include "translit_combining";""
+translit_end
+
 class    "hanzi"; /
 <U3007>;/
 <U3400>..<U4DBF>;/
 <U4E00>..<U9FA5>;/
 <UF900>..<UFA6A>;/
-<U00020000>..<U0002A6D6>;/
-<U0002F800>..<U0002FA1D>
+<U00020000>..<U0002FA1D>
 END LC_CTYPE

 LC_COLLATE
-copy "iso14651_t1"
+copy "cns11643_stroke"
 END LC_COLLATE

 LC_TIME
@@ -74,16 +71,16 @@ mon           "<U4E00><U6708>";/
      "<U5341><U6708>";/
      "<U5341><U4E00><U6708>";/
      "<U5341><U4E8C><U6708>"
-%  1月,  2月,  3月,  4月,  5月,  6月,  7月,  8月,  9月, 10月, 11月, 12月
-abmon         " 1<U6708>";/
-       " 2<U6708>";/
-       " 3<U6708>";/
-       " 4<U6708>";/
-       " 5<U6708>";/
-       " 6<U6708>";/
-       " 7<U6708>";/
-       " 8<U6708>";/
-       " 9<U6708>";/
+% 1月, 2月, 3月, 4月, 5月, 6月, 7月, 8月, 9月, 10月, 11月, 12月
+abmon         "1<U6708>";/
+       "2<U6708>";/
+       "3<U6708>";/
+       "4<U6708>";/
+       "5<U6708>";/
+       "6<U6708>";/
+       "7<U6708>";/
+       "8<U6708>";/
+       "9<U6708>";/
        "10<U6708>";/
        "11<U6708>";/
        "12<U6708>"
@@ -103,19 +100,20 @@ abday         "<U65E5>";/
        "<U56DB>";/
        "<U4E94>";/
        "<U516D>"
-% %Y年%m月%d日 (%A) %H點%M分%S秒
-d_t_fmt       "%Y<U5E74>%m<U6708>%d<U65E5> (%A) %H<U9EDE>%M<U5206>%S<U79D2>"
-% %Y年%m月%d日
-d_fmt         "%Y<U5E74>%m<U6708>%d<U65E5>"
+% %Y年%m月%d號 (%A) %H點%M分%S秒
+d_t_fmt       "%Y<U5E74>%m<U6708>%d<U865F> (%A) %H<U9EDE>%M<U5206>%S<U79D2>"
+% %Y年%m月%d號
+d_fmt         "%Y<U5E74>%m<U6708>%d<U865F>"
 % %H點%M分%S秒
 t_fmt         "%H<U9EDE>%M<U5206>%S<U79D2>"
 % 上晝, 下晝
 am_pm         "<U4E0A><U665D>";"<U4E0B><U665D>"
 % %p %I點%M分%S秒
 t_fmt_ampm    "%p %I<U9EDE>%M<U5206>%S<U79D2>"
-% %Y年 %b %e日 %A %H:%M:%S %Z
-date_fmt      "%Y<U5E74> %b %e<U65E5> %A %H:%M:%S %Z"
+% %Y年 %b %-d號 %A %H:%M:%S %Z
+date_fmt      "%Y<U5E74> %b %-d<U865F> %A %H:%M:%S %Z"
 week 7;19971130;1
+first_weekday 2

 era "+:2:1913//01//01:+*:<U6C11><U570B>:%EC%Ey<U5E74>";/
     "+:1:1912//01//01:1912//12//31:<U6C11><U570B>:%EC<U5143><U5E74>";/
@@ -124,7 +122,7 @@ END LC_TIME

 LC_NUMERIC
 decimal_point "."
-thousands_sep ","
+thousands_sep "<U2009>"
 grouping      4
 END LC_NUMERIC

@@ -132,7 +130,7 @@ LC_MONETARY
 currency_symbol    "NT$"
 int_curr_symbol    "TWD "
 mon_decimal_point  "."
-mon_thousands_sep  ","
+mon_thousands_sep  "<U2009>"
 mon_grouping       4
 positive_sign      ""
 negative_sign      "-"
@@ -153,18 +151,22 @@ int_n_sign_posn    1
 END LC_MONETARY

 LC_PAPER
-copy "i18n"
+height 297
+width  210
 END LC_PAPER

 LC_MEASUREMENT
-copy "i18n"
+% metric
+measurement 1
 END LC_MEASUREMENT

 LC_MESSAGES
-% ^[+1yYyY係]
-yesexpr "^[+1yY<UFF59><UFF39><U4FC2>]"
-% ^[-0nNnN毋]
-noexpr  "^[-0nN<UFF4E><UFF2E><U6BCB>]"
+yesexpr "^[yY]"
+noexpr  "^[nN]"
+% 係
+yesstr  "<U4FC2>"
+% 毋係
+nostr   "<U6BCB><U4FC2>"
 END LC_MESSAGES

 LC_NAME
@@ -191,8 +193,8 @@ country_ab3  "TWN"
 country_num  158
 country_car "RC"
 country_isbn 957
-% 客家語
-lang_name    "<U5BA2><U5BB6><U8A71>"
+% 漢語客家語
+lang_name    "<U6F22><U8A9E><U5BA2><U5BB6><U8A9E>"
 lang_term    "hak"
 lang_lib     "hak"
 END LC_ADDRESS
diff --git a/localedata/locales/lzh_TW b/localedata/locales/lzh_TW
index 4740418a83..ba4c495b09 100644
--- a/localedata/locales/lzh_TW
+++ b/localedata/locales/lzh_TW
@@ -8,15 +8,9 @@ escape_char /
 % exempt you from the conditions of the license if your use would
 % otherwise be governed by that license.

-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-%
 % Literary Chinese locale for the Republic of China
-%
 % Prepared and contributed to glibc by Wei-Lun Chao <bluebat@member.fsf.org>
-%
 % build with: localedef -f UTF-8 -i lzh_TW lzh_TW
-%
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

 LC_IDENTIFICATION
 title        "Literary Chinese locale for the Republic of China"
@@ -28,8 +22,8 @@ tel          ""
 fax          ""
 language     "Literary Chinese"
 territory    "Taiwan"
-revision     "0.1"
-date         "2013-06-02"
+revision     "0.2"
+date         "2021-04-21"

 category "i18n:2012";LC_IDENTIFICATION
 category "i18n:2012";LC_CTYPE
@@ -47,17 +41,20 @@ END LC_IDENTIFICATION

 LC_CTYPE
 copy "i18n"
+translit_start
+include "translit_combining";""
+translit_end
+
 class    "hanzi"; /
 <U3007>;/
 <U3400>..<U4DBF>;/
 <U4E00>..<U9FA5>;/
 <UF900>..<UFA6A>;/
-<U00020000>..<U0002A6D6>;/
-<U0002F800>..<U0002FA1D>
+<U00020000>..<U0002FA1D>
 END LC_CTYPE

 LC_COLLATE
-copy "iso14651_t1"
+copy "cns11643_stroke"
 END LC_COLLATE

 LC_TIME
@@ -74,17 +71,17 @@ mon           "<U4E00><U6708>";/
      "<U5341><U6708>";/
      "<U5341><U4E00><U6708>";/
      "<U5341><U4E8C><U6708>"
-%  一 ,  二 ,  三 ,  四 ,  五 ,  六 ,  七 ,  八 ,  九 ,  十 , 十一, 十二
-abmon         " <U4E00> ";/
-       " <U4E8C> ";/
-       " <U4E09> ";/
-       " <U56DB> ";/
-       " <U4E94> ";/
-       " <U516D> ";/
-       " <U4E03> ";/
-       " <U516B> ";/
-       " <U4E5D> ";/
-       " <U5341> ";/
+% 一, 二, 三, 四, 五, 六, 七, 八, 九, 十, 十一, 十二
+abmon         "<U4E00>";/
+       "<U4E8C>";/
+       "<U4E09>";/
+       "<U56DB>";/
+       "<U4E94>";/
+       "<U516D>";/
+       "<U4E03>";/
+       "<U516B>";/
+       "<U4E5D>";/
+       "<U5341>";/
        "<U5341><U4E00>";/
        "<U5341><U4E8C>"
 % 週日, 週一, 週二, 週三, 週四, 週五, 週六
@@ -103,19 +100,21 @@ abday         "<U65E5>";/
        "<U56DB>";/
        "<U4E94>";/
        "<U516D>"
-% %OC%Oy年%B%Od日 (%A) %OH時%OM分%OS秒
-d_t_fmt       "%OC%Oy<U5E74>%B%Od<U65E5> (%A) %OH<U6642>%OM<U5206>%OS<U79D2>"
-% %OC%Oy年%B%Od日
-d_fmt         "%OC%Oy<U5E74>%B%Od<U65E5>"
+% %Y年%B%Od (%A) %OH時%OM分%OS秒
+d_t_fmt       "%Y<U5E74>%B%Od (%A) %OH<U6642>%OM<U5206>%OS<U79D2>"
+% %Y年%B%Od
+d_fmt         "%Y<U5E74>%B%Od"
 % %OH時%OM分%OS秒
 t_fmt         "%OH<U6642>%OM<U5206>%OS<U79D2>"
 % 朝, 暮
-am_pm         "<U671D>";"<U66AE>"
+am_pm         "<U671D>";/
+       "<U66AE>"
 % %p %OI時%OM分%OS秒
 t_fmt_ampm    "%p %OI<U6642>%OM<U5206>%OS<U79D2>"
-% 公曆 %C%Oy年 %B %Oe日 %A %OH時%OM分%OS秒
-date_fmt      "<U516C><U66C6> %C%Oy<U5E74> %B %Oe<U65E5> %A
%OH<U6642>%OM<U5206>%OS<U79D2>"
-% 〇, 一, 二, 三, 四, 五, 六, 七, 八, 九, 十, 十一, 十二, 十三, 十四, 十五, 十六, 十七, 十八,
十九, 廿, 廿一, 廿二, 廿三, 廿四, 廿五, 廿六, 廿七, 廿八, 廿九, 卅, 卅一
+% 公曆 %Y年 %B %Oe %A %OH時%OM分%OS秒
+date_fmt      "<U516C><U66C6> %Y<U5E74> %B %Oe %A
%OH<U6642>%OM<U5206>%OS<U79D2>"
+% 〇, 一, 二, 三, 四, 五, 六, 七, 八, 九, 十, 十一, 十二, 十三, 十四, 十五, 十六, 十七, 十八,
十九, 廿, 廿一, 廿二, 廿三, 廿四, 廿五, 廿六, 廿七, 廿八, 廿九, 卅, 卅一,
+% 卅二, 卅三, 卅四, 卅五, 卅六, 卅七, 卅八, 卅九, 四十, 四十一, 四十二, 四十三, 四十四, 四十五, 四十六,
四十七, 四十八, 四十九, 五十, 五十一, 五十二, 五十三, 五十四, 五十五, 五十六, 五十七, 五十八, 五十九
 alt_digits    "<U3007>";/
             "<U4E00>";/
             "<U4E8C>";/
@@ -147,9 +146,38 @@ alt_digits    "<U3007>";/
             "<U5EFF><U516B>";/
             "<U5EFF><U4E5D>";/
             "<U5345>";/
-            "<U5345><U4E00>"
+            "<U5345><U4E00>";/
+            "<U5345><U4E8C>";/
+            "<U5345><U4E09>";/
+            "<U5345><U56DB>";/
+            "<U5345><U4E94>";/
+            "<U5345><U516D>";/
+            "<U5345><U4E03>";/
+            "<U5345><U516B>";/
+            "<U5345><U4E5D>";/
+            "<U56DB><U5341>";/
+            "<U56DB><U5341><U4E00>";/
+            "<U56DB><U5341><U4E8C>";/
+            "<U56DB><U5341><U4E09>";/
+            "<U56DB><U5341><U56DB>";/
+            "<U56DB><U5341><U4E94>";/
+            "<U56DB><U5341><U516D>";/
+            "<U56DB><U5341><U4E03>";/
+            "<U56DB><U5341><U516B>";/
+            "<U56DB><U5341><U4E5D>";/
+            "<U56DB><U5341>";/
+            "<U4E94><U5341><U4E00>";/
+            "<U4E94><U5341><U4E8C>";/
+            "<U4E94><U5341><U4E09>";/
+            "<U4E94><U5341><U56DB>";/
+            "<U4E94><U5341><U4E94>";/
+            "<U4E94><U5341><U516D>";/
+            "<U4E94><U5341><U4E03>";/
+            "<U4E94><U5341><U516B>";/
+            "<U4E94><U5341><U4E5D>"
 %
 week 7;19971130;1
+first_weekday 2

 era "+:2:1913//01//01:+*:<U6C11><U570B>:%EC%Ey<U5E74>";/
     "+:1:1912//01//01:1912//12//31:<U6C11><U570B>:%EC<U5143><U5E74>";/
@@ -158,7 +186,7 @@ END LC_TIME

 LC_NUMERIC
 decimal_point "."
-thousands_sep ","
+thousands_sep "<U2009>"
 grouping      4
 END LC_NUMERIC

@@ -166,7 +194,7 @@ LC_MONETARY
 currency_symbol    "NT$"
 int_curr_symbol    "TWD "
 mon_decimal_point  "."
-mon_thousands_sep  ","
+mon_thousands_sep  "<U2009>"
 mon_grouping       4
 positive_sign      ""
 negative_sign      "-"
@@ -187,18 +215,22 @@ int_n_sign_posn    1
 END LC_MONETARY

 LC_PAPER
-copy "i18n"
+height 297
+width  210
 END LC_PAPER

 LC_MEASUREMENT
-copy "i18n"
+% metric
+measurement 1
 END LC_MEASUREMENT

 LC_MESSAGES
-% ^[+1yYyY是]
-yesexpr "^[+1yY<UFF59><UFF39><U662F>]"
-% ^[-0nNnN非]
-noexpr  "^[-0nN<UFF4E><UFF2E><U975E>]"
+yesexpr "^[yY]"
+noexpr  "^[nN]"
+% 是
+yesstr  "<U662F>"
+% 否
+nostr   "<U5426>"
 END LC_MESSAGES

 LC_NAME
diff --git a/localedata/locales/nan_TW b/localedata/locales/nan_TW
index 0c2a56f4ca..83e47afbae 100644
--- a/localedata/locales/nan_TW
+++ b/localedata/locales/nan_TW
@@ -1,22 +1,16 @@
 comment_char %
 escape_char /

-% This file is part of the GNU C Library and contains locale data.
-% The Free Software Foundation does not claim any copyright interest
-% in the locale data contained in this file.  The foregoing does not
-% affect the license of the GNU C Library as a whole.  It does not
-% exempt you from the conditions of the license if your use would
-% otherwise be governed by that license.
-
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-%
+% This file is a part of GNU C Library (glibc) and contains locale data. The
+% Free Software Foundation does not claim any copyright interest in the
+% locale data contained in this file. The foregoing does not affect the
+% license of GNU C Library (glibc) as a whole. It does not exempt you from the
+% conditions of the license if your use would otherwise be governed by
+% that license.
+
 % Min Nan Chinese locale for the Republic of China
-%
 % Prepared and contributed to glibc by Wei-Lun Chao <bluebat@member.fsf.org>
-%
 % build with: localedef -f UTF-8 -i nan_TW nan_TW
-%
-%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

 LC_IDENTIFICATION
 title        "Min Nan Chinese locale for the Republic of China"
@@ -28,8 +22,8 @@ tel          ""
 fax          ""
 language     "Min Nan Chinese"
 territory    "Taiwan"
-revision     "0.1"
-date         "2013-06-02"
+revision     "0.2"
+date         "2021-04-21"

 category "i18n:2012";LC_IDENTIFICATION
 category "i18n:2012";LC_CTYPE
@@ -47,17 +41,20 @@ END LC_IDENTIFICATION

 LC_CTYPE
 copy "i18n"
+translit_start
+include "translit_combining";""
+translit_end
+
 class    "hanzi"; /
 <U3007>;/
 <U3400>..<U4DBF>;/
 <U4E00>..<U9FA5>;/
 <UF900>..<UFA6A>;/
-<U00020000>..<U0002A6D6>;/
-<U0002F800>..<U0002FA1D>
+<U00020000>..<U0002FA1D>
 END LC_CTYPE

 LC_COLLATE
-copy "iso14651_t1"
+copy "cns11643_stroke"
 END LC_COLLATE

 LC_TIME
@@ -74,16 +71,16 @@ mon           "<U4E00><U6708>";/
      "<U5341><U6708>";/
      "<U5341><U4E00><U6708>";/
      "<U5341><U4E8C><U6708>"
-%  1月,  2月,  3月,  4月,  5月,  6月,  7月,  8月,  9月, 10月, 11月, 12月
-abmon         " 1<U6708>";/
-       " 2<U6708>";/
-       " 3<U6708>";/
-       " 4<U6708>";/
-       " 5<U6708>";/
-       " 6<U6708>";/
-       " 7<U6708>";/
-       " 8<U6708>";/
-       " 9<U6708>";/
+% 1月, 2月, 3月, 4月, 5月, 6月, 7月, 8月, 9月, 10月, 11月, 12月
+abmon         "1<U6708>";/
+       "2<U6708>";/
+       "3<U6708>";/
+       "4<U6708>";/
+       "5<U6708>";/
+       "6<U6708>";/
+       "7<U6708>";/
+       "8<U6708>";/
+       "9<U6708>";/
        "10<U6708>";/
        "11<U6708>";/
        "12<U6708>"
@@ -103,10 +100,10 @@ abday         "<U65E5>";/
        "<U56DB>";/
        "<U4E94>";/
        "<U516D>"
-% %Y年%m月%d日 (%A) %H點%M分%S秒
-d_t_fmt       "%Y<U5E74>%m<U6708>%d<U65E5> (%A) %H<U9EDE>%M<U5206>%S<U79D2>"
-% %Y年%m月%d日
-d_fmt         "%Y<U5E74>%m<U6708>%d<U65E5>"
+% %Y年%m月%d號 (%A) %H點%M分%S秒
+d_t_fmt       "%Y<U5E74>%m<U6708>%d<U865F> (%A) %H<U9EDE>%M<U5206>%S<U79D2>"
+% %Y年%m月%d號
+d_fmt         "%Y<U5E74>%m<U6708>%d<U865F>"
 % %H點%M分%S秒
 t_fmt         "%H<U9EDE>%M<U5206>%S<U79D2>"
 % 頂晡, 下晡
@@ -114,9 +111,10 @@ am_pm         "<U9802><U6661>";/
        "<U4E0B><U6661>"
 % %p %I點%M分%S秒
 t_fmt_ampm    "%p %I<U9EDE>%M<U5206>%S<U79D2>"
-% %Y年 %b %e日 %A %H:%M:%S %Z
-date_fmt      "%Y<U5E74> %b %e<U65E5> %A %H:%M:%S %Z"
+% %Y年 %b %-d號 %A %H:%M:%S %Z
+date_fmt      "%Y<U5E74> %b %-d<U865F> %A %H:%M:%S %Z"
 week 7;19971130;1
+first_weekday 2

 era "+:2:1913//01//01:+*:<U6C11><U570B>:%EC%Ey<U5E74>";/
     "+:1:1912//01//01:1912//12//31:<U6C11><U570B>:%EC<U5143><U5E74>";/
@@ -125,7 +123,7 @@ END LC_TIME

 LC_NUMERIC
 decimal_point "."
-thousands_sep ","
+thousands_sep "<U2009>"
 grouping      4
 END LC_NUMERIC

@@ -133,7 +131,7 @@ LC_MONETARY
 currency_symbol    "NT$"
 int_curr_symbol    "TWD "
 mon_decimal_point  "."
-mon_thousands_sep  ","
+mon_thousands_sep  "<U2009>"
 mon_grouping       4
 positive_sign      ""
 negative_sign      "-"
@@ -154,18 +152,22 @@ int_n_sign_posn    1
 END LC_MONETARY

 LC_PAPER
-copy "i18n"
+height 297
+width  210
 END LC_PAPER

 LC_MEASUREMENT
-copy "i18n"
+% metric
+measurement 1
 END LC_MEASUREMENT

 LC_MESSAGES
-% ^[+1yYyY是]
-yesexpr "^[+1yY<UFF59><UFF39><U662F>]"
-% ^[-0nNnN伓]
-noexpr  "^[-0nN<UFF4E><UFF2E><U4F13>]"
+yesexpr "^[yY]"
+noexpr  "^[nN]"
+% 是
+yesstr  "<U662F>"
+% 毋是
+nostr   "<U6BCB><U662F>"
 END LC_MESSAGES

 LC_NAME
@@ -192,8 +194,8 @@ country_ab3  "TWN"
 country_num  158
 country_car "RC"
 country_isbn 957
-% 閩南語
-lang_name    "<U95A9><U5357><U8A9E>"
+% 漢語閩南語
+lang_name    "<U6F22><U8A9E><U95A9><U5357><U8A9E>"
 lang_term    "nan"
 lang_lib     "nan"
 END LC_ADDRESS
-- 
2.31.1

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
  2021-05-10  3:07   ` Wei-Lun Chao
@ 2021-05-11 11:15     ` TAMUKI Shoichi
  2021-05-13  3:53       ` Wei-Lun Chao
  2021-05-11 12:41     ` TAMUKI Shoichi
  1 sibling, 1 reply; 11+ messages in thread
From: TAMUKI Shoichi @ 2021-05-11 11:15 UTC (permalink / raw)
  To: Wei-Lun Chao; +Cc: Carlos O'Donell, libc-alpha

Hello Wei-Lun-san,

From: Wei-Lun Chao via Libc-alpha <libc-alpha@sourceware.org>
Subject: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
Date: Mon, 10 May 2021 11:07:27 +0800

> Rationale:
> * Header cleanup: make the header of localedata files consistent
> * Remove space (abmon): remove the extra prefix space in abmon 1~9

Why are you trying to remove the extra prefix space in abmon 1..9?
By fixing the display width of abbreviated month names (%b) in the
same way as "Jan", "Feb", "Mar", ..., it has the effect of making the
display width constant, such as system log.
I don't think we should remove the leading space in abmon 1..9.

Regards,
TAMUKI Shoichi

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
  2021-05-10  3:07   ` Wei-Lun Chao
  2021-05-11 11:15     ` TAMUKI Shoichi
@ 2021-05-11 12:41     ` TAMUKI Shoichi
  2021-05-13  5:10       ` Wei-Lun Chao
  1 sibling, 1 reply; 11+ messages in thread
From: TAMUKI Shoichi @ 2021-05-11 12:41 UTC (permalink / raw)
  To: Wei-Lun Chao; +Cc: Carlos O'Donell, libc-alpha

Hello Wei-Lun-san,

From: Wei-Lun Chao via Libc-alpha <libc-alpha@sourceware.org>
Subject: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
Date: Mon, 10 May 2021 11:07:27 +0800

> Changelog:
> * localedata/locales/cmn_TW: Header cleanup; Remove space (abmon); Add (week); Change (thousands_sep); Simplify (yesexpr) and (noexpr).
> * localedata/locales/hak_TW: Likewise and add collation.
> * localedata/locales/nan_TW: Likewise and add collation.
> * localedata/locales/lzh_TW: Likewise and add collation.

If elements from 0 to 59 are defined for alt_digits in lzh_TW, there
are the following problems:

$ LANG=lzh_TW date -d "1959-04-01 09:00:00" +"%Oy<U5E74>"
<U4E94><U5341><U4E5D><U5E74>
$ LANG=lzh_TW date -d "1960-04-01 09:00:00" +"%Oy<U5E74>"
60<U5E74>

Up to 99 elements should be defined for alt_digits.

Regards,
TAMUKI Shoichi

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
  2021-05-11 11:15     ` TAMUKI Shoichi
@ 2021-05-13  3:53       ` Wei-Lun Chao
  2021-05-16 21:46         ` TAMUKI Shoichi
       [not found]         ` <202105161000.AA00005@tamuki.linet.gr.jp>
  0 siblings, 2 replies; 11+ messages in thread
From: Wei-Lun Chao @ 2021-05-13  3:53 UTC (permalink / raw)
  To: TAMUKI Shoichi; +Cc: Carlos O'Donell, libc-alpha

Hello,

Without this patch, "date +%b" will output with a leading space for month 1..9.
And the day number makes the display width inconstant already.
So I think single space would be a better separator.

Regards,
Wei-Lun CHAO

TAMUKI Shoichi <tamuki@linet.gr.jp> 於 2021年5月11日 週二 下午7:17寫道:
>
> Hello Wei-Lun-san,
>
> From: Wei-Lun Chao via Libc-alpha <libc-alpha@sourceware.org>
> Subject: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
> Date: Mon, 10 May 2021 11:07:27 +0800
>
> > Rationale:
> > * Header cleanup: make the header of localedata files consistent
> > * Remove space (abmon): remove the extra prefix space in abmon 1~9
>
> Why are you trying to remove the extra prefix space in abmon 1..9?
> By fixing the display width of abbreviated month names (%b) in the
> same way as "Jan", "Feb", "Mar", ..., it has the effect of making the
> display width constant, such as system log.
> I don't think we should remove the leading space in abmon 1..9.
>
> Regards,
> TAMUKI Shoichi

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
  2021-05-11 12:41     ` TAMUKI Shoichi
@ 2021-05-13  5:10       ` Wei-Lun Chao
  2021-05-16 21:46         ` TAMUKI Shoichi
       [not found]         ` <202105161001.AA00006@tamuki.linet.gr.jp>
  0 siblings, 2 replies; 11+ messages in thread
From: Wei-Lun Chao @ 2021-05-13  5:10 UTC (permalink / raw)
  To: TAMUKI Shoichi; +Cc: Carlos O'Donell, libc-alpha

Hello,

First, alt_digits works like "alt_numbers". I don't know how to just
map each digit to another character.
Before this patch, alt_digits covers 0..31, and this patch covers
0..59. I am not sure, is it worthy to extend
to 0..99, because those presentations are not suitable for year
numbers. For example:
$ LANG=lzh_TW date -d "1959-04-01 09:00:00" +"%Oy<U5E74>"
We will expect <U4E94><U4E5D><U5E74> instead of <U4E94><U5341><U4E5D><U5E74>

Regards,
Wei-Lun CHAO

TAMUKI Shoichi <tamuki@linet.gr.jp> 於 2021年5月11日 週二 下午8:42寫道:
>
> Hello Wei-Lun-san,
>
> From: Wei-Lun Chao via Libc-alpha <libc-alpha@sourceware.org>
> Subject: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
> Date: Mon, 10 May 2021 11:07:27 +0800
>
> > Changelog:
> > * localedata/locales/cmn_TW: Header cleanup; Remove space (abmon); Add (week); Change (thousands_sep); Simplify (yesexpr) and (noexpr).
> > * localedata/locales/hak_TW: Likewise and add collation.
> > * localedata/locales/nan_TW: Likewise and add collation.
> > * localedata/locales/lzh_TW: Likewise and add collation.
>
> If elements from 0 to 59 are defined for alt_digits in lzh_TW, there
> are the following problems:
>
> $ LANG=lzh_TW date -d "1959-04-01 09:00:00" +"%Oy<U5E74>"
> <U4E94><U5341><U4E5D><U5E74>
> $ LANG=lzh_TW date -d "1960-04-01 09:00:00" +"%Oy<U5E74>"
> 60<U5E74>
>
> Up to 99 elements should be defined for alt_digits.
>
> Regards,
> TAMUKI Shoichi

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
  2021-05-13  3:53       ` Wei-Lun Chao
@ 2021-05-16 21:46         ` TAMUKI Shoichi
       [not found]         ` <202105161000.AA00005@tamuki.linet.gr.jp>
  1 sibling, 0 replies; 11+ messages in thread
From: TAMUKI Shoichi @ 2021-05-16 21:46 UTC (permalink / raw)
  To: Wei-Lun Chao; +Cc: Carlos O'Donell, libc-alpha

[-- Attachment #1: Type: text/plain, Size: 1549 bytes --]

Hello Wei-Lun-san,

From: Wei-Lun Chao <bluebat@member.fsf.org>
Subject: Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
Date: Thu, 13 May 2021 11:53:38 +0800

> > > Rationale:
> > > * Header cleanup: make the header of localedata files consistent
> > > * Remove space (abmon): remove the extra prefix space in abmon 1~9
> > 
> > Why are you trying to remove the extra prefix space in abmon 1..9?
> > By fixing the display width of abbreviated month names (%b) in the
> > same way as "Jan", "Feb", "Mar", ..., it has the effect of making the
> > display width constant, such as system log.
> > I don't think we should remove the leading space in abmon 1..9.
> 
> Without this patch, "date +%b" will output with a leading space for month 1..9.
> And the day number makes the display width inconstant already.
> So I think single space would be a better separator.

The elements defined in (ab)mon and (ab)day in the current *_TW locale
are summarized in the attached file mon+day.txt.  In each locale, the
display widths of mon (%B) and abday (%A) can change, while the
display widths of abmon (%b) and abday (%a) are constant.

Date and time notations such as logs and form lists may sometimes be
in RFC2822 (%a, %d %b %Y %T %z) or ctime (%a %b %d %T %Z %Y) format
with local locales.

With this patch, these display widths will change in *_TW locale,
even though the display width of each conversion specification that
makes up them is intended to be constant.  Please see the attached
file ctime.txt.

Regards,
TAMUKI Shoichi

[-- Attachment #2: mon+day.txt --]
[-- Type: application/octet-stream, Size: 4196 bytes --]

		zh_TW		lzh_TW		cmn_TW		nan_TW		nan_TW@latin	hak_TW		ja_JP		POSIX(C)

mon (%B)	"一月"		"一月"		"一月"		"一月"		"1goe̍h"	"一月"		"1月"		"January"
		"二月"		"二月"		"二月"		"二月"		"2goe̍h"	"二月"		"2月"		"February"
		"三月"		"三月"		"三月"		"三月"		"3goe̍h"	"三月"		"3月"		"March"
		"四月"		"四月"		"四月"		"四月"		"4goe̍h"	"四月"		"4月"		"April"
		"五月"		"五月"		"五月"		"五月"		"5goe̍h"	"五月"		"5月"		"May"
		"六月"		"六月"		"六月"		"六月"		"6goe̍h"	"六月"		"6月"		"June"
		"七月"		"七月"		"七月"		"七月"		"7goe̍h"	"七月"		"7月"		"July"
		"八月"		"八月"		"八月"		"八月"		"8goe̍h"	"八月"		"8月"		"August"
		"九月"		"九月"		"九月"		"九月"		"9goe̍h"	"九月"		"9月"		"September"
		"十月"		"十月"		"十月"		"十月"		"10goe̍h"	"十月"		"10月"		"October"
		"十一月"	"十一月"	"十一月"	"十一月"	"11goe̍h"	"十一月"	"11月"		"November"
		"十二月"	"十二月"	"十二月"	"十二月"	"12goe̍h"	"十二月"	"12月"		"December"

abmon (%b)	" 1月"		" 一 "		" 1月"		" 1月"		"1g"		" 1月"		" 1月"		"Jan"
		" 2月"		" 二 "		" 2月"		" 2月"		"2g"		" 2月"		" 2月"		"Feb"
		" 3月"		" 三 "		" 3月"		" 3月"		"3g"		" 3月"		" 3月"		"Mar"
		" 4月"		" 四 "		" 4月"		" 4月"		"4g"		" 4月"		" 4月"		"Apr"
		" 5月"		" 五 "		" 5月"		" 5月"		"5g"		" 5月"		" 5月"		"May"
		" 6月"		" 六 "		" 6月"		" 6月"		"6g"		" 6月"		" 6月"		"Jun"
		" 7月"		" 七 "		" 7月"		" 7月"		"7g"		" 7月"		" 7月"		"Jul"
		" 8月"		" 八 "		" 8月"		" 8月"		"8g"		" 8月"		" 8月"		"Aug"
		" 9月"		" 九 "		" 9月"		" 9月"		"9g"		" 9月"		" 9月"		"Sep"
		"10月"		" 十 "		"10月"		"10月"		"10g"		"10月"		"10月"		"Oct"
		"11月"		"十一"		"11月"		"11月"		"11g"		"11月"		"11月"		"Nov"
		"12月"		"十二"		"12月"		"12月"		"12g"		"12月"		"12月"		"Dec"

day (%A)	"週日"		"週日"		"星期日"	"禮拜日"	"lé-pài-ji̍"	"禮拜日"	"日曜日"	"Sunday"
		"週一"		"週一"		"星期一"	"禮拜一"	"pài-it"	"禮拜一"	"月曜日"	"Monday"
		"週二"		"週二"		"星期二"	"禮拜二"	"pài-jī"	"禮拜二"	"火曜日"	"Tuesday"
		"週三"		"週三"		"星期三"	"禮拜三"	"pài-saⁿ"	"禮拜三"	"水曜日"	"Wednesday"
		"週四"		"週四"		"星期四"	"禮拜四"	"pài-sì"	"禮拜四"	"木曜日"	"Thursday"
		"週五"		"週五"		"星期五"	"禮拜五"	"pài-gō͘"	"禮拜五"	"金曜日"	"Friday"
		"週六"		"週六"		"星期六"	"禮拜六"	"pài-la̍k"	"禮拜六"	"土曜日"	"Saturday"

abday (%a)	"日"		"日"		"日"		"日"		"lp"		"日"		"日"		"Sun"
		"一"		"一"		"一"		"一"		"p1"		"一"		"月"		"Mon"
		"二"		"二"		"二"		"二"		"p2"		"二"		"火"		"Tue"
		"三"		"三"		"三"		"三"		"p3"		"三"		"水"		"Wed"
		"四"		"四"		"四"		"四"		"p4"		"四"		"木"		"Thu"
		"五"		"五"		"五"		"五"		"p5"		"五"		"金"		"Fri"
		"六"		"六"		"六"		"六"		"p6"		"六"		"土"		"Sat"

zh_TW:		         Chinese  locale for Taiwan R.O.C.		中華民國的中文言環境			中華民国の中国語ロケール
lzh_TW:		Literary Chinese  locale for the Republic of China	中華民國的漢語文言言環境		中華民国の漢文ロケール
cmn_TW:		Mandarin Chinese  locale for the Republic of China	中華民國的漢語官話言環境		中華民国の北京語ロケール
nan_TW:		Min Nan  Chinese  locale for the Republic of China	中華民國的漢語閩南語言環境		中華民国の閩南語ロケール
nan_TW@latin:	Minnan   Language Locale for Taiwan			中華民國的漢語閩南語拉丁腳本語言環境	中華民国の閩南語ラテン文字ロケール
hak_TW:		Hakka    Chinese  locale for the Republic of China	中華民國的漢語客家語言環境		中華民国の客家語ロケール
ja_JP:		Japanese language locale for Japan			日本的日語語言環境			日本の日本語ロケール

zh_TW:		"西元%Y年%m月%d日 (%A) %H時%M分%S秒 %Z"
lzh_TW:		"公曆 %C%Oy年 %B %Oe日 %A %OH時%OM分%OS秒"
cmn_TW:		"%Y年 %b %-d號 %A %H:%M:%S %Z"
nan_TW:		"%Y年 %b %e日 %A %H:%M:%S %Z"
nan_TW@latin:	"%Y %b %d (%a) %H:%M:%S %Z"
hak_TW:		"%Y年 %b %e日 %A %H:%M:%S %Z"
ja_JP:		"%Y年 %b %e日 %A %H:%M:%S %Z"

[-- Attachment #3: ctime.txt --]
[-- Type: application/octet-stream, Size: 1906 bytes --]

$ LANG=C ; for i in `seq -w 12` ; do date -d "2021-$i-01 09:00:00" +"%a %b %d %T %Z %Y" ; done
Fri Jan 01 09:00:00 JST 2021
Mon Feb 01 09:00:00 JST 2021
Mon Mar 01 09:00:00 JST 2021
Thu Apr 01 09:00:00 JST 2021
Sat May 01 09:00:00 JST 2021
Tue Jun 01 09:00:00 JST 2021
Thu Jul 01 09:00:00 JST 2021
Sun Aug 01 09:00:00 JST 2021
Wed Sep 01 09:00:00 JST 2021
Fri Oct 01 09:00:00 JST 2021
Mon Nov 01 09:00:00 JST 2021
Wed Dec 01 09:00:00 JST 2021
$ LANG=ja_JP.UTF-8 ; for i in `seq -w 12` ; do date -d "2021-$i-01 09:00:00" +"%a %b %d %T %Z %Y" ; done
金  1月 01 09:00:00 JST 2021
月  2月 01 09:00:00 JST 2021
月  3月 01 09:00:00 JST 2021
木  4月 01 09:00:00 JST 2021
土  5月 01 09:00:00 JST 2021
火  6月 01 09:00:00 JST 2021
木  7月 01 09:00:00 JST 2021
日  8月 01 09:00:00 JST 2021
水  9月 01 09:00:00 JST 2021
金 10月 01 09:00:00 JST 2021
月 11月 01 09:00:00 JST 2021
水 12月 01 09:00:00 JST 2021

[without this patch]
$ LANG=zh_TW.UTF-8 ; for i in `seq -w 12` ; do date -d "2021-$i-01 09:00:00" +"%a %b %d %T %Z %Y" ; done
五  1月 01 09:00:00 JST 2021
一  2月 01 09:00:00 JST 2021
一  3月 01 09:00:00 JST 2021
四  4月 01 09:00:00 JST 2021
六  5月 01 09:00:00 JST 2021
二  6月 01 09:00:00 JST 2021
四  7月 01 09:00:00 JST 2021
日  8月 01 09:00:00 JST 2021
三  9月 01 09:00:00 JST 2021
五 10月 01 09:00:00 JST 2021
一 11月 01 09:00:00 JST 2021
三 12月 01 09:00:00 JST 2021

[with this patch]
$ LANG=zh_TW.UTF-8 ; for i in `seq -w 12` ; do date -d "2021-$i-01 09:00:00" +"%a %b %d %T %Z %Y" ; done
五 1月 01 09:00:00 JST 2021
一 2月 01 09:00:00 JST 2021
一 3月 01 09:00:00 JST 2021
四 4月 01 09:00:00 JST 2021
六 5月 01 09:00:00 JST 2021
二 6月 01 09:00:00 JST 2021
四 7月 01 09:00:00 JST 2021
日 8月 01 09:00:00 JST 2021
三 9月 01 09:00:00 JST 2021
五 10月 01 09:00:00 JST 2021
一 11月 01 09:00:00 JST 2021
三 12月 01 09:00:00 JST 2021

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
  2021-05-13  5:10       ` Wei-Lun Chao
@ 2021-05-16 21:46         ` TAMUKI Shoichi
       [not found]         ` <202105161001.AA00006@tamuki.linet.gr.jp>
  1 sibling, 0 replies; 11+ messages in thread
From: TAMUKI Shoichi @ 2021-05-16 21:46 UTC (permalink / raw)
  To: Wei-Lun Chao; +Cc: Carlos O'Donell, libc-alpha

[-- Attachment #1: Type: text/plain, Size: 2132 bytes --]

Hello Wei-Lun-san,

From: Wei-Lun Chao <bluebat@member.fsf.org>
Subject: Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
Date: Thu, 13 May 2021 13:10:12 +0800

> > > Changelog:
> > > * localedata/locales/cmn_TW: Header cleanup; Remove space (abmon); Add
> > > (week); Change (thousands_sep); Simplify (yesexpr) and (noexpr).
> > > * localedata/locales/hak_TW: Likewise and add collation.
> > > * localedata/locales/nan_TW: Likewise and add collation.
> > > * localedata/locales/lzh_TW: Likewise and add collation.
> > 
> > If elements from 0 to 59 are defined for alt_digits in lzh_TW, there
> > are the following problems:
> > 
> > $ LANG=lzh_TW date -d "1959-04-01 09:00:00" +"%Oy<U5E74>"
> > <U4E94><U5341><U4E5D><U5E74>
> > $ LANG=lzh_TW date -d "1960-04-01 09:00:00" +"%Oy<U5E74>"
> > 60<U5E74>
> > 
> > Up to 99 elements should be defined for alt_digits.
> 
> First, alt_digits works like "alt_numbers". I don't know how to just
> map each digit to another character.
> Before this patch, alt_digits covers 0..31, and this patch covers
> 0..59. I am not sure, is it worthy to extend
> to 0..99, because those presentations are not suitable for year
> numbers. For example:
> $ LANG=lzh_TW date -d "1959-04-01 09:00:00" +"%Oy<U5E74>"
> We will expect <U4E94><U4E5D><U5E74> instead of <U4E94><U5341><U4E5D><U5E74>

I understand what you are concerned about.

In Japan, for example, it is not sutable to use number names to
express another form of year notation using alternative numeric
symbols in years such as AD 1984 and AD 645.  It is commonly expressed
in positional notation.  I think the situation is the same in Taiwan.

On the other hand, for example, it is not suitable to use positional
notation to express another form of year notation using alternative
numeric symbols in years such as AD 78.  It is commonly expressed in
number names.  Please see the attached file alt_digits.txt.

I think that these boundaries are empirically determined by whether
the numerical value is 2 digits or less or 3 digits or more.
Therefore, it makes sense to define alt_digits up to 99.

Regards,
TAMUKI Shoichi

[-- Attachment #2: alt_digits.txt --]
[-- Type: application/octet-stream, Size: 1922 bytes --]

[year notation]
西暦1984年		(Arabic numerals)
西暦千九百八十四年	(number names)		;not suitable
西暦一九八四年		(positional notation)	;suitable

西暦645年		(Arabic numerals)
西暦六百四十五年	(number names)		;not suitable
西暦六四五年		(positional notation)	;suitable

西暦78年		(Arabic numerals)
西暦七十八年		(number names)		;suitable
西暦七八年		(positional notation)	;not suitable

	ja_JP		lzh_TW		fa_IR		my_MM
0	〇		〇		۰		၀
1	一		一		۱		၁
9	九		九		۹		၉
10	十		十		۱۰		၁၀
11	十一		十一		۱۱		၁၁
19	十九		十九		۱۹		၁၉
20	二十		廿		۲۰		၂၀
21	二十一		廿一		۲۱		၂၁
29	二十九		廿九		۲۹		၂၉
30	三十		卅		۳۰		၃၀
31	三十一		卅一		۳۱		၃၁
39	三十九		卅九		۳۹		၃၉
40	四十		四十		۴۰		၄၀
41	四十一		四十一		۴۱		၄၁
78	七十八		七十八		۷۸		၇၈
99	九十九		九十九		۹۹		၉၉
100	一〇〇		一〇〇		۱۰۰		၁၀၀
101	一〇一		一〇一		۱۰۱		၁၀၁
645	六四五		六四五		۶۴۵		၆၄၅
999	九九九		九九九		۹۹۹		၉၉၉
1000	一〇〇〇	一〇〇〇	۱۰۰۰		၁၀၀၀
1001	一〇〇一	一〇〇一	۱۰۰۱		၁၀၀၁
1984	一九八四	一九八四	۱۹۸۴		၁၉၈၄
2021	二〇二一	二〇二一	۲۰۲۱		၂၀၂၁

# The following features have not been implemented yet.
# See [BZ #24453][BZ #24471] in detail.

$ LANG=ja_JP.UTF-8 date -d "1987-04-01 09:00:00" +"西暦%OY年"
西暦一九八七年
$ LANG=ja_JP.UTF-8 date -d "1987-04-01 09:00:00" +"%OEY"
昭和六十二年
$ LANG=lzh_TW.UTF-8 date -d "1987-04-01 09:00:00" +"%OEY"
民國七十六年

$ LANG=ja_JP.UTF-8 date -d "2021-04-01 09:00:00" +"西暦%OY年"
西暦二〇二一年
$ LANG=ja_JP.UTF-8 date -d "2021-04-01 09:00:00" +"%OEY"
令和三年
$ LANG=lzh_TW.UTF-8 date -d "2021-04-01 09:00:00" +"%OEY"
民國一一〇年

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
       [not found]         ` <202105161000.AA00005@tamuki.linet.gr.jp>
@ 2021-11-19 14:47           ` Wei-Lun Chao
  0 siblings, 0 replies; 11+ messages in thread
From: Wei-Lun Chao @ 2021-11-19 14:47 UTC (permalink / raw)
  To: TAMUKI Shoichi; +Cc: Carlos O'Donell, libc-alpha

Dear Shoichi,

Thanks for your explanation.
I'll drop this part of patch.

TAMUKI Shoichi <tamuki@linet.gr.jp> 於 2021年5月16日 週日 下午6:04寫道:
>
> Hello Wei-Lun-san,
>
> From: Wei-Lun Chao <bluebat@member.fsf.org>
> Subject: Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
> Date: Thu, 13 May 2021 11:53:38 +0800
>
> > > > Rationale:
> > > > * Header cleanup: make the header of localedata files consistent
> > > > * Remove space (abmon): remove the extra prefix space in abmon 1~9
> > >
> > > Why are you trying to remove the extra prefix space in abmon 1..9?
> > > By fixing the display width of abbreviated month names (%b) in the
> > > same way as "Jan", "Feb", "Mar", ..., it has the effect of making the
> > > display width constant, such as system log.
> > > I don't think we should remove the leading space in abmon 1..9.
> >
> > Without this patch, "date +%b" will output with a leading space for month 1..9.
> > And the day number makes the display width inconstant already.
> > So I think single space would be a better separator.
>
> The elements defined in (ab)mon and (ab)day in the current *_TW locale
> are summarized in the attached file mon+day.png.  In each locale, the
> display widths of mon (%B) and abday (%A) can change, while the
> display widths of abmon (%b) and abday (%a) are constant.
>
> Date and time notations such as logs and form lists may sometimes be
> in RFC2822 (%a, %d %b %Y %T %z) or ctime (%a %b %d %T %Z %Y) format
> with local locales.
>
> With this patch, these display widths will change in *_TW locale,
> even though the display width of each conversion specification that
> makes up them is intended to be constant.  Please see the attached
> file ctime.png.
>
> Regards,
> TAMUKI Shoichi

^ permalink raw reply	[flat|nested] 11+ messages in thread

* Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
       [not found]         ` <202105161001.AA00006@tamuki.linet.gr.jp>
@ 2021-11-19 14:48           ` Wei-Lun Chao
  0 siblings, 0 replies; 11+ messages in thread
From: Wei-Lun Chao @ 2021-11-19 14:48 UTC (permalink / raw)
  To: TAMUKI Shoichi; +Cc: Carlos O'Donell, libc-alpha

Dear Shoichi,

Thanks for your explanation.
I'll add this part of patch.

TAMUKI Shoichi <tamuki@linet.gr.jp> 於 2021年5月16日 週日 下午6:04寫道:
>
> Hello Wei-Lun-san,
>
> From: Wei-Lun Chao <bluebat@member.fsf.org>
> Subject: Re: [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409]
> Date: Thu, 13 May 2021 13:10:12 +0800
>
> > > > Changelog:
> > > > * localedata/locales/cmn_TW: Header cleanup; Remove space (abmon); Add
> > > > (week); Change (thousands_sep); Simplify (yesexpr) and (noexpr).
> > > > * localedata/locales/hak_TW: Likewise and add collation.
> > > > * localedata/locales/nan_TW: Likewise and add collation.
> > > > * localedata/locales/lzh_TW: Likewise and add collation.
> > >
> > > If elements from 0 to 59 are defined for alt_digits in lzh_TW, there
> > > are the following problems:
> > >
> > > $ LANG=lzh_TW date -d "1959-04-01 09:00:00" +"%Oy<U5E74>"
> > > <U4E94><U5341><U4E5D><U5E74>
> > > $ LANG=lzh_TW date -d "1960-04-01 09:00:00" +"%Oy<U5E74>"
> > > 60<U5E74>
> > >
> > > Up to 99 elements should be defined for alt_digits.
> >
> > First, alt_digits works like "alt_numbers". I don't know how to just
> > map each digit to another character.
> > Before this patch, alt_digits covers 0..31, and this patch covers
> > 0..59. I am not sure, is it worthy to extend
> > to 0..99, because those presentations are not suitable for year
> > numbers. For example:
> > $ LANG=lzh_TW date -d "1959-04-01 09:00:00" +"%Oy<U5E74>"
> > We will expect <U4E94><U4E5D><U5E74> instead of <U4E94><U5341><U4E5D><U5E74>
>
> I understand what you are concerned about.
>
> In Japan, for example, it is not sutable to use number names to
> express another form of year notation using alternative numeric
> symbols in years such as AD 1984 and AD 645.  It is commonly expressed
> in positional notation.  I think the situation is the same in Taiwan.
>
> On the other hand, for example, it is not suitable to use positional
> notation to express another form of year notation using alternative
> numeric symbols in years such as AD 78.  It is commonly expressed in
> number names.  Please see the attached file alt_digits.png.
>
> I think that these boundaries are empirically determined by whether
> the numerical value is 2 digits or less or 3 digits or more.
> Therefore, it makes sense to define alt_digits up to 99.
>
> Regards,
> TAMUKI Shoichi

^ permalink raw reply	[flat|nested] 11+ messages in thread

end of thread, other threads:[~2021-11-19 14:48 UTC | newest]

Thread overview: 11+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2021-04-21  5:38 [PATCH v2] localedata: Updates for Taiwanese locales [BZ #24409] Wei-Lun Chao
2021-05-07 21:23 ` Carlos O'Donell
2021-05-10  3:07   ` Wei-Lun Chao
2021-05-11 11:15     ` TAMUKI Shoichi
2021-05-13  3:53       ` Wei-Lun Chao
2021-05-16 21:46         ` TAMUKI Shoichi
     [not found]         ` <202105161000.AA00005@tamuki.linet.gr.jp>
2021-11-19 14:47           ` Wei-Lun Chao
2021-05-11 12:41     ` TAMUKI Shoichi
2021-05-13  5:10       ` Wei-Lun Chao
2021-05-16 21:46         ` TAMUKI Shoichi
     [not found]         ` <202105161001.AA00006@tamuki.linet.gr.jp>
2021-11-19 14:48           ` Wei-Lun Chao

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).