@@ -846,6 +846,16 @@ def getpreferredencoding(do_setlocale = True):
846
846
#
847
847
# SS 2014-10-01:
848
848
# Updated alias mapping with glibc 2.19 supported locales.
849
+ #
850
+ # SS 2018-05-05:
851
+ # Updated alias mapping with glibc 2.27 supported locales.
852
+ #
853
+ # These are the differences compared to the old mapping (Python 3.6.5
854
+ # and older):
855
+ #
856
+ # updated 'ca_es@valencia' -> 'ca_ES.ISO8859-15@valencia' to 'ca_ES.UTF-8@valencia'
857
+ # updated 'kk_kz' -> 'kk_KZ.RK1048' to 'kk_KZ.ptcp154'
858
+ # updated 'russian' -> 'ru_RU.ISO8859-5' to 'ru_RU.KOI8-R'
849
859
850
860
locale_alias = {
851
861
'a3' : 'az_AZ.KOI8-C' ,
@@ -856,10 +866,13 @@ def getpreferredencoding(do_setlocale = True):
856
866
'aa_et' : 'aa_ET.UTF-8' ,
857
867
'af' : 'af_ZA.ISO8859-1' ,
858
868
'af_za' : 'af_ZA.ISO8859-1' ,
869
+ 'agr_pe' : 'agr_PE.UTF-8' ,
870
+ 'ak_gh' : 'ak_GH.UTF-8' ,
859
871
'am' : 'am_ET.UTF-8' ,
860
872
'am_et' : 'am_ET.UTF-8' ,
861
873
'american' : 'en_US.ISO8859-1' ,
862
874
'an_es' : 'an_ES.ISO8859-15' ,
875
+ 'anp_in' : 'anp_IN.UTF-8' ,
863
876
'ar' : 'ar_AA.ISO8859-6' ,
864
877
'ar_aa' : 'ar_AA.ISO8859-6' ,
865
878
'ar_ae' : 'ar_AE.ISO8859-6' ,
@@ -877,6 +890,7 @@ def getpreferredencoding(do_setlocale = True):
877
890
'ar_qa' : 'ar_QA.ISO8859-6' ,
878
891
'ar_sa' : 'ar_SA.ISO8859-6' ,
879
892
'ar_sd' : 'ar_SD.ISO8859-6' ,
893
+ 'ar_ss' : 'ar_SS.UTF-8' ,
880
894
'ar_sy' : 'ar_SY.ISO8859-6' ,
881
895
'ar_tn' : 'ar_TN.ISO8859-6' ,
882
896
'ar_ye' : 'ar_YE.ISO8859-6' ,
@@ -888,6 +902,7 @@ def getpreferredencoding(do_setlocale = True):
888
902
'az' : 'az_AZ.ISO8859-9E' ,
889
903
'az_az' : 'az_AZ.ISO8859-9E' ,
890
904
'az_az.iso88599e' : 'az_AZ.ISO8859-9E' ,
905
+ 'az_ir' : 'az_IR.UTF-8' ,
891
906
'be' : 'be_BY.CP1251' ,
892
907
'be@latin' : 'be_BY.UTF-8@latin' ,
893
908
'be_bg.utf8' : 'bg_BG.UTF-8' ,
@@ -898,13 +913,17 @@ def getpreferredencoding(do_setlocale = True):
898
913
'ber_ma' : 'ber_MA.UTF-8' ,
899
914
'bg' : 'bg_BG.CP1251' ,
900
915
'bg_bg' : 'bg_BG.CP1251' ,
916
+ 'bhb_in.utf8' : 'bhb_IN.UTF-8' ,
901
917
'bho_in' : 'bho_IN.UTF-8' ,
918
+ 'bho_np' : 'bho_NP.UTF-8' ,
919
+ 'bi_vu' : 'bi_VU.UTF-8' ,
902
920
'bn_bd' : 'bn_BD.UTF-8' ,
903
921
'bn_in' : 'bn_IN.UTF-8' ,
904
922
'bo_cn' : 'bo_CN.UTF-8' ,
905
923
'bo_in' : 'bo_IN.UTF-8' ,
906
924
'bokmal' : 'nb_NO.ISO8859-1' ,
907
925
'bokm\xe5l' : 'nb_NO.ISO8859-1' ,
926
+ 'bokm\xef\xbf\xbd' : 'nb_NO.ISO8859-1' ,
908
927
'br' : 'br_FR.ISO8859-1' ,
909
928
'br_fr' : 'br_FR.ISO8859-1' ,
910
929
'brx_in' : 'brx_IN.UTF-8' ,
@@ -923,13 +942,17 @@ def getpreferredencoding(do_setlocale = True):
923
942
'ca' : 'ca_ES.ISO8859-1' ,
924
943
'ca_ad' : 'ca_AD.ISO8859-1' ,
925
944
'ca_es' : 'ca_ES.ISO8859-1' ,
926
- 'ca_es@valencia' : 'ca_ES.ISO8859-15@valencia' ,
945
+ 'ca_es@valencia' : 'ca_ES.UTF-8@valencia' ,
927
946
'ca_fr' : 'ca_FR.ISO8859-1' ,
928
947
'ca_it' : 'ca_IT.ISO8859-1' ,
929
948
'catalan' : 'ca_ES.ISO8859-1' ,
949
+ 'ce_ru' : 'ce_RU.UTF-8' ,
930
950
'cextend' : 'en_US.ISO8859-1' ,
931
951
'chinese-s' : 'zh_CN.eucCN' ,
932
952
'chinese-t' : 'zh_TW.eucTW' ,
953
+ 'chr_us' : 'chr_US.UTF-8' ,
954
+ 'ckb_iq' : 'ckb_IQ.UTF-8' ,
955
+ 'cmn_tw' : 'cmn_TW.UTF-8' ,
933
956
'crh_ua' : 'crh_UA.UTF-8' ,
934
957
'croatian' : 'hr_HR.ISO8859-2' ,
935
958
'cs' : 'cs_CZ.ISO8859-2' ,
@@ -951,6 +974,7 @@ def getpreferredencoding(do_setlocale = True):
951
974
'de_be' : 'de_BE.ISO8859-1' ,
952
975
'de_ch' : 'de_CH.ISO8859-1' ,
953
976
'de_de' : 'de_DE.ISO8859-1' ,
977
+ 'de_it' : 'de_IT.ISO8859-1' ,
954
978
'de_li.utf8' : 'de_LI.UTF-8' ,
955
979
'de_lu' : 'de_LU.ISO8859-1' ,
956
980
'deutsch' : 'de_DE.ISO8859-1' ,
@@ -977,10 +1001,12 @@ def getpreferredencoding(do_setlocale = True):
977
1001
'en_gb' : 'en_GB.ISO8859-1' ,
978
1002
'en_hk' : 'en_HK.ISO8859-1' ,
979
1003
'en_ie' : 'en_IE.ISO8859-1' ,
1004
+ 'en_il' : 'en_IL.UTF-8' ,
980
1005
'en_in' : 'en_IN.ISO8859-1' ,
981
1006
'en_ng' : 'en_NG.UTF-8' ,
982
1007
'en_nz' : 'en_NZ.ISO8859-1' ,
983
1008
'en_ph' : 'en_PH.ISO8859-1' ,
1009
+ 'en_sc.utf8' : 'en_SC.UTF-8' ,
984
1010
'en_sg' : 'en_SG.ISO8859-1' ,
985
1011
'en_uk' : 'en_GB.ISO8859-1' ,
986
1012
'en_us' : 'en_US.ISO8859-1' ,
@@ -991,6 +1017,7 @@ def getpreferredencoding(do_setlocale = True):
991
1017
'en_zw.utf8' : 'en_ZS.UTF-8' ,
992
1018
'eng_gb' : 'en_GB.ISO8859-1' ,
993
1019
'english' : 'en_EN.ISO8859-1' ,
1020
+ 'english.iso88591' : 'en_US.ISO8859-1' ,
994
1021
'english_uk' : 'en_GB.ISO8859-1' ,
995
1022
'english_united-states' : 'en_US.ISO8859-1' ,
996
1023
'english_united-states.437' : 'C' ,
@@ -1045,6 +1072,7 @@ def getpreferredencoding(do_setlocale = True):
1045
1072
'fr_fr' : 'fr_FR.ISO8859-1' ,
1046
1073
'fr_lu' : 'fr_LU.ISO8859-1' ,
1047
1074
'fran\xe7ais' : 'fr_FR.ISO8859-1' ,
1075
+ 'fran\xef\xbf\xbdis' : 'fr_FR.ISO8859-1' ,
1048
1076
'fre_fr' : 'fr_FR.ISO8859-1' ,
1049
1077
'french' : 'fr_FR.ISO8859-1' ,
1050
1078
'french.iso88591' : 'fr_CH.ISO8859-1' ,
@@ -1071,12 +1099,14 @@ def getpreferredencoding(do_setlocale = True):
1071
1099
'gv' : 'gv_GB.ISO8859-1' ,
1072
1100
'gv_gb' : 'gv_GB.ISO8859-1' ,
1073
1101
'ha_ng' : 'ha_NG.UTF-8' ,
1102
+ 'hak_tw' : 'hak_TW.UTF-8' ,
1074
1103
'he' : 'he_IL.ISO8859-8' ,
1075
1104
'he_il' : 'he_IL.ISO8859-8' ,
1076
1105
'hebrew' : 'he_IL.ISO8859-8' ,
1077
1106
'hi' : 'hi_IN.ISCII-DEV' ,
1078
1107
'hi_in' : 'hi_IN.ISCII-DEV' ,
1079
1108
'hi_in.isciidev' : 'hi_IN.ISCII-DEV' ,
1109
+ 'hif_fj' : 'hif_FJ.UTF-8' ,
1080
1110
'hne' : 'hne_IN.UTF-8' ,
1081
1111
'hne_in' : 'hne_IN.UTF-8' ,
1082
1112
'hr' : 'hr_HR.ISO8859-2' ,
@@ -1131,7 +1161,8 @@ def getpreferredencoding(do_setlocale = True):
1131
1161
'ka_ge.georgianacademy' : 'ka_GE.GEORGIAN-ACADEMY' ,
1132
1162
'ka_ge.georgianps' : 'ka_GE.GEORGIAN-PS' ,
1133
1163
'ka_ge.georgianrs' : 'ka_GE.GEORGIAN-ACADEMY' ,
1134
- 'kk_kz' : 'kk_KZ.RK1048' ,
1164
+ 'kab_dz' : 'kab_DZ.UTF-8' ,
1165
+ 'kk_kz' : 'kk_KZ.ptcp154' ,
1135
1166
'kl' : 'kl_GL.ISO8859-1' ,
1136
1167
'kl_gl' : 'kl_GL.ISO8859-1' ,
1137
1168
'km_kh' : 'km_KH.UTF-8' ,
@@ -1157,6 +1188,7 @@ def getpreferredencoding(do_setlocale = True):
1157
1188
'li_nl' : 'li_NL.UTF-8' ,
1158
1189
'lij_it' : 'lij_IT.UTF-8' ,
1159
1190
'lithuanian' : 'lt_LT.ISO8859-13' ,
1191
+ 'ln_cd' : 'ln_CD.UTF-8' ,
1160
1192
'lo' : 'lo_LA.MULELAO-1' ,
1161
1193
'lo_la' : 'lo_LA.MULELAO-1' ,
1162
1194
'lo_la.cp1133' : 'lo_LA.IBM-CP1133' ,
@@ -1166,13 +1198,18 @@ def getpreferredencoding(do_setlocale = True):
1166
1198
'lt_lt' : 'lt_LT.ISO8859-13' ,
1167
1199
'lv' : 'lv_LV.ISO8859-13' ,
1168
1200
'lv_lv' : 'lv_LV.ISO8859-13' ,
1201
+ 'lzh_tw' : 'lzh_TW.UTF-8' ,
1169
1202
'mag_in' : 'mag_IN.UTF-8' ,
1170
1203
'mai' : 'mai_IN.UTF-8' ,
1171
1204
'mai_in' : 'mai_IN.UTF-8' ,
1205
+ 'mai_np' : 'mai_NP.UTF-8' ,
1206
+ 'mfe_mu' : 'mfe_MU.UTF-8' ,
1172
1207
'mg_mg' : 'mg_MG.ISO8859-15' ,
1173
1208
'mhr_ru' : 'mhr_RU.UTF-8' ,
1174
1209
'mi' : 'mi_NZ.ISO8859-1' ,
1175
1210
'mi_nz' : 'mi_NZ.ISO8859-1' ,
1211
+ 'miq_ni' : 'miq_NI.UTF-8' ,
1212
+ 'mjw_in' : 'mjw_IN.UTF-8' ,
1176
1213
'mk' : 'mk_MK.ISO8859-5' ,
1177
1214
'mk_mk' : 'mk_MK.ISO8859-5' ,
1178
1215
'ml' : 'ml_IN.UTF-8' ,
@@ -1186,7 +1223,7 @@ def getpreferredencoding(do_setlocale = True):
1186
1223
'mt' : 'mt_MT.ISO8859-3' ,
1187
1224
'mt_mt' : 'mt_MT.ISO8859-3' ,
1188
1225
'my_mm' : 'my_MM.UTF-8' ,
1189
- 'nan_tw@latin' : 'nan_TW.UTF-8@latin' ,
1226
+ 'nan_tw' : 'nan_TW.UTF-8' ,
1190
1227
'nb' : 'nb_NO.ISO8859-1' ,
1191
1228
'nb_no' : 'nb_NO.ISO8859-1' ,
1192
1229
'nds_de' : 'nds_DE.UTF-8' ,
@@ -1225,6 +1262,8 @@ def getpreferredencoding(do_setlocale = True):
1225
1262
'pa_in' : 'pa_IN.UTF-8' ,
1226
1263
'pa_pk' : 'pa_PK.UTF-8' ,
1227
1264
'pap_an' : 'pap_AN.UTF-8' ,
1265
+ 'pap_aw' : 'pap_AW.UTF-8' ,
1266
+ 'pap_cw' : 'pap_CW.UTF-8' ,
1228
1267
'pd' : 'pd_US.ISO8859-1' ,
1229
1268
'pd_de' : 'pd_DE.ISO8859-1' ,
1230
1269
'pd_us' : 'pd_US.ISO8859-1' ,
@@ -1243,14 +1282,16 @@ def getpreferredencoding(do_setlocale = True):
1243
1282
'pt' : 'pt_PT.ISO8859-1' ,
1244
1283
'pt_br' : 'pt_BR.ISO8859-1' ,
1245
1284
'pt_pt' : 'pt_PT.ISO8859-1' ,
1285
+ 'quz_pe' : 'quz_PE.UTF-8' ,
1286
+ 'raj_in' : 'raj_IN.UTF-8' ,
1246
1287
'ro' : 'ro_RO.ISO8859-2' ,
1247
1288
'ro_ro' : 'ro_RO.ISO8859-2' ,
1248
1289
'romanian' : 'ro_RO.ISO8859-2' ,
1249
1290
'ru' : 'ru_RU.UTF-8' ,
1250
1291
'ru_ru' : 'ru_RU.UTF-8' ,
1251
1292
'ru_ua' : 'ru_UA.KOI8-U' ,
1252
1293
'rumanian' : 'ro_RO.ISO8859-2' ,
1253
- 'russian' : 'ru_RU.ISO8859-5' ,
1294
+ 'russian' : 'ru_RU.KOI8-R' ,
1254
1295
'rw' : 'rw_RW.ISO8859-1' ,
1255
1296
'rw_rw' : 'rw_RW.ISO8859-1' ,
1256
1297
'sa_in' : 'sa_IN.UTF-8' ,
@@ -1262,12 +1303,14 @@ def getpreferredencoding(do_setlocale = True):
1262
1303
'sd_pk' : 'sd_PK.UTF-8' ,
1263
1304
'se_no' : 'se_NO.UTF-8' ,
1264
1305
'serbocroatian' : 'sr_RS.UTF-8@latin' ,
1306
+ 'sgs_lt' : 'sgs_LT.UTF-8' ,
1265
1307
'sh' : 'sr_RS.UTF-8@latin' ,
1266
1308
'sh_ba.iso88592@bosnia' : 'sr_CS.ISO8859-2' ,
1267
1309
'sh_hr' : 'sh_HR.ISO8859-2' ,
1268
1310
'sh_hr.iso88592' : 'hr_HR.ISO8859-2' ,
1269
1311
'sh_sp' : 'sr_CS.ISO8859-2' ,
1270
1312
'sh_yu' : 'sr_RS.UTF-8@latin' ,
1313
+ 'shn_mm' : 'shn_MM.UTF-8' ,
1271
1314
'shs_ca' : 'shs_CA.UTF-8' ,
1272
1315
'si' : 'si_LK.UTF-8' ,
1273
1316
'si_lk' : 'si_LK.UTF-8' ,
@@ -1281,6 +1324,7 @@ def getpreferredencoding(do_setlocale = True):
1281
1324
'slovak' : 'sk_SK.ISO8859-2' ,
1282
1325
'slovene' : 'sl_SI.ISO8859-2' ,
1283
1326
'slovenian' : 'sl_SI.ISO8859-2' ,
1327
+ 'sm_ws' : 'sm_WS.UTF-8' ,
1284
1328
'so_dj' : 'so_DJ.ISO8859-1' ,
1285
1329
'so_et' : 'so_ET.UTF-8' ,
1286
1330
'so_ke' : 'so_KE.ISO8859-1' ,
@@ -1327,6 +1371,7 @@ def getpreferredencoding(do_setlocale = True):
1327
1371
'ta_in.tscii' : 'ta_IN.TSCII-0' ,
1328
1372
'ta_in.tscii0' : 'ta_IN.TSCII-0' ,
1329
1373
'ta_lk' : 'ta_LK.UTF-8' ,
1374
+ 'tcy_in.utf8' : 'tcy_IN.UTF-8' ,
1330
1375
'te' : 'te_IN.UTF-8' ,
1331
1376
'te_in' : 'te_IN.UTF-8' ,
1332
1377
'tg' : 'tg_TJ.KOI8-C' ,
@@ -1336,6 +1381,7 @@ def getpreferredencoding(do_setlocale = True):
1336
1381
'th_th.tactis' : 'th_TH.TIS620' ,
1337
1382
'th_th.tis620' : 'th_TH.TIS620' ,
1338
1383
'thai' : 'th_TH.ISO8859-11' ,
1384
+ 'the_np' : 'the_NP.UTF-8' ,
1339
1385
'ti_er' : 'ti_ER.UTF-8' ,
1340
1386
'ti_et' : 'ti_ET.UTF-8' ,
1341
1387
'tig_er' : 'tig_ER.UTF-8' ,
@@ -1344,6 +1390,8 @@ def getpreferredencoding(do_setlocale = True):
1344
1390
'tl_ph' : 'tl_PH.ISO8859-1' ,
1345
1391
'tn' : 'tn_ZA.ISO8859-15' ,
1346
1392
'tn_za' : 'tn_ZA.ISO8859-15' ,
1393
+ 'to_to' : 'to_TO.UTF-8' ,
1394
+ 'tpi_pg' : 'tpi_PG.UTF-8' ,
1347
1395
'tr' : 'tr_TR.ISO8859-9' ,
1348
1396
'tr_cy' : 'tr_CY.ISO8859-9' ,
1349
1397
'tr_tr' : 'tr_TR.ISO8859-9' ,
@@ -1386,6 +1434,7 @@ def getpreferredencoding(do_setlocale = True):
1386
1434
'yi_us' : 'yi_US.CP1255' ,
1387
1435
'yo_ng' : 'yo_NG.UTF-8' ,
1388
1436
'yue_hk' : 'yue_HK.UTF-8' ,
1437
+ 'yuw_pg' : 'yuw_PG.UTF-8' ,
1389
1438
'zh' : 'zh_CN.eucCN' ,
1390
1439
'zh_cn' : 'zh_CN.gb2312' ,
1391
1440
'zh_cn.big5' : 'zh_TW.big5' ,
0 commit comments