Set width of JUNGSEONG/JONGSEONG characters from UD7B0 to UD7FB to 0 [BZ #26120]

author Mike FABIAN <mfabian@redhat.com>
Tue, 16 Jun 2020 06:29:40 +0000 (08:29 +0200)
committer Mike FABIAN <mfabian@redhat.com>
Fri, 26 Jun 2020 07:54:43 +0000 (09:54 +0200)
diff --git a/localedata/charmaps/UTF-8 b/localedata/charmaps/UTF-8

index 14c5d4fa334ba05eeb9ee5b8a349f9d83abbe994..8cce47cd97217daaf9141f8f1162dd30ecdad7bb 100644 (file)
--- a/localedata/charmaps/UTF-8
+++ b/localedata/charmaps/UTF-8
@@ -48920,6 +48920,8 @@ WIDTH
  <UABE8>        0
  <UABED>        0
  <UAC00>...<UD7A3>      2
+<UD7B0>...<UD7C6>      0
+<UD7CB>...<UD7FB>      0
  <UF900>...<UFA6D>      2
  <UFA70>...<UFAD9>      2
  <UFB1E>        0
diff --git a/localedata/locales/i18n_ctype b/localedata/locales/i18n_ctype

index 6f078a101d5936ce6946c53caf9c37b93b8c43c6..c63e0790fc71c1c1d99a9af6ab8e72445b8d3b78 100644 (file)
--- a/localedata/locales/i18n_ctype
+++ b/localedata/locales/i18n_ctype
@@ -26,7 +26,7 @@ fax       ""
  language  ""
  territory "Earth"
  revision  "13.0.0"
-date      "2020-04-14"
+date      "2020-06-25"
  category  "i18n:2012";LC_CTYPE
  END LC_IDENTIFICATION
  
diff --git a/localedata/locales/tr_TR b/localedata/locales/tr_TR

index d5785ceca1a96a1cbf66588efd5e52d25a590eca..7dbb923228a35bdab21aaed2b950e976def6d4b4 100644 (file)
--- a/localedata/locales/tr_TR
+++ b/localedata/locales/tr_TR
@@ -43,7 +43,7 @@ fax        ""
  language   "Turkish"
  territory  "Turkey"
  revision   "1.0"
-date       "2020-04-14"
+date       "2020-06-25"
  
  category "i18n:2012";LC_IDENTIFICATION
  category "i18n:2012";LC_CTYPE
diff --git a/localedata/locales/translit_circle b/localedata/locales/translit_circle

index 0f1e81541c31fe1a049fcee45cb73b5fcae463e7..5c07b44532c6f936eca2bdb561a5e0c555b9a28e 100644 (file)
--- a/localedata/locales/translit_circle
+++ b/localedata/locales/translit_circle
@@ -9,7 +9,7 @@ comment_char %
  % otherwise be governed by that license.
  
  % Transliterations of encircled characters.
-% Generated automatically from UnicodeData.txt by gen_translit_circle.py on 2020-04-14 for Unicode 13.0.0.
+% Generated automatically from UnicodeData.txt by gen_translit_circle.py on 2020-06-25 for Unicode 13.0.0.
  
  LC_CTYPE
  
diff --git a/localedata/locales/translit_cjk_compat b/localedata/locales/translit_cjk_compat

index 17b74134fc06598f94b063499d163f4f3befadfa..ee0d7f83c6641f10c1729e46faee25bc5753bfae 100644 (file)
--- a/localedata/locales/translit_cjk_compat
+++ b/localedata/locales/translit_cjk_compat
@@ -9,7 +9,7 @@ comment_char %
  % otherwise be governed by that license.
  
  % Transliterations of CJK compatibility characters.
-% Generated automatically from UnicodeData.txt by gen_translit_cjk_compat.py on 2020-04-14 for Unicode 13.0.0.
+% Generated automatically from UnicodeData.txt by gen_translit_cjk_compat.py on 2020-06-25 for Unicode 13.0.0.
  
  LC_CTYPE
  
diff --git a/localedata/locales/translit_combining b/localedata/locales/translit_combining

index d5c8bbfe8f80936b4a93aa3bfbeda4fbbf330ae7..36128f097a855db0045f122e5bd955e91d4990d6 100644 (file)
--- a/localedata/locales/translit_combining
+++ b/localedata/locales/translit_combining
@@ -10,7 +10,7 @@ comment_char %
  
  % Transliterations that remove all combining characters (accents,
  % pronounciation marks, etc.).
-% Generated automatically from UnicodeData.txt by gen_translit_combining.py on 2020-04-14 for Unicode 13.0.0.
+% Generated automatically from UnicodeData.txt by gen_translit_combining.py on 2020-06-25 for Unicode 13.0.0.
  
  LC_CTYPE
  
diff --git a/localedata/locales/translit_compat b/localedata/locales/translit_compat

index ff18b02ea361b1410c508e7fccda18843849b44e..ac24c4e9386c41fbef315b9857c5b2423c9fd02d 100644 (file)
--- a/localedata/locales/translit_compat
+++ b/localedata/locales/translit_compat
@@ -9,7 +9,7 @@ comment_char %
  % otherwise be governed by that license.
  
  % Transliterations of compatibility characters and ligatures.
-% Generated automatically from UnicodeData.txt by gen_translit_compat.py on 2020-04-14 for Unicode 13.0.0.
+% Generated automatically from UnicodeData.txt by gen_translit_compat.py on 2020-06-25 for Unicode 13.0.0.
  
  LC_CTYPE
  
diff --git a/localedata/locales/translit_font b/localedata/locales/translit_font

index e79b0d83f560e798231c877ca0ee54d904477712..680c4ed4267782670166b80d2dfde2c2d7bca74b 100644 (file)
--- a/localedata/locales/translit_font
+++ b/localedata/locales/translit_font
@@ -9,7 +9,7 @@ comment_char %
  % otherwise be governed by that license.
  
  % Transliterations of font equivalents.
-% Generated automatically from UnicodeData.txt by gen_translit_font.py on 2020-04-14 for Unicode 13.0.0.
+% Generated automatically from UnicodeData.txt by gen_translit_font.py on 2020-06-25 for Unicode 13.0.0.
  
  LC_CTYPE
  
diff --git a/localedata/locales/translit_fraction b/localedata/locales/translit_fraction

index 197d57a6449b001497bf016b6fe566faf66fcd2f..b52244969e8e581f74f15763149ec0a312cedf6a 100644 (file)
--- a/localedata/locales/translit_fraction
+++ b/localedata/locales/translit_fraction
@@ -9,7 +9,7 @@ comment_char %
  % otherwise be governed by that license.
  
  % Transliterations of fractions.
-% Generated automatically from UnicodeData.txt by gen_translit_fraction.py on 2020-04-14 for Unicode 13.0.0.
+% Generated automatically from UnicodeData.txt by gen_translit_fraction.py on 2020-06-25 for Unicode 13.0.0.
  % The replacements have been surrounded with spaces, because fractions are
  % often preceded by a decimal number and followed by a unit or a math symbol.
  
diff --git a/localedata/unicode-gen/utf8_gen.py b/localedata/unicode-gen/utf8_gen.py

index 17b99ee88d200ccd49c13ef2d778ec57a03aa2db..11c906b92fe9946a95e4be4a2764580b06bdca2d 100755 (executable)
--- a/localedata/unicode-gen/utf8_gen.py
+++ b/localedata/unicode-gen/utf8_gen.py
@@ -258,7 +258,13 @@ def process_width(outfile, ulines, elines, plines):
          if key in width_dict:
              del width_dict[key] # default width is 1
      for key in list(range(0x1160, 0x1200)):
-        width_dict[key] = 0
+        # Hangul jungseong and jongseong:
+        if key in unicode_utils.UNICODE_ATTRIBUTES:
+            width_dict[key] = 0
+    for key in list(range(0xD7B0, 0xD800)):
+        # Hangul jungseong and jongseong:
+        if key in unicode_utils.UNICODE_ATTRIBUTES:
+            width_dict[key] = 0
      for key in list(range(0x3248, 0x3250)):
          # These are “A” which means we can decide whether to treat them
          # as “W” or “N” based on context:
@@ -327,6 +333,7 @@ if __name__ == "__main__":
          help='The Unicode version of the input files used.')
      ARGS = PARSER.parse_args()
  
+    unicode_utils.fill_attributes(ARGS.unicode_data_file)
      with open(ARGS.unicode_data_file, mode='r') as UNIDATA_FILE:
          UNICODE_DATA_LINES = UNIDATA_FILE.readlines()
      with open(ARGS.east_asian_with_file, mode='r') as EAST_ASIAN_WIDTH_FILE:
author	Mike FABIAN <mfabian@redhat.com>
	Tue, 16 Jun 2020 06:29:40 +0000 (08:29 +0200)
committer	Mike FABIAN <mfabian@redhat.com>
	Fri, 26 Jun 2020 07:54:43 +0000 (09:54 +0200)
localedata/charmaps/UTF-8		patch | blob | blame | history
localedata/locales/i18n_ctype		patch | blob | blame | history
localedata/locales/tr_TR		patch | blob | blame | history
localedata/locales/translit_circle		patch | blob | blame | history
localedata/locales/translit_cjk_compat		patch | blob | blame | history
localedata/locales/translit_combining		patch | blob | blame | history
localedata/locales/translit_compat		patch | blob | blame | history
localedata/locales/translit_font		patch | blob | blame | history
localedata/locales/translit_fraction		patch | blob | blame | history
localedata/unicode-gen/utf8_gen.py		patch | blob | blame | history