Systèmes d'encodage des caractères de TXM

Introduction

Certains systèmes d'encodage se distinguent selon le système d'exploitation d'origine des fichiers sources (typiquement d'extension .txt ou .TXT) :

  • si vous êtes sous Windows : essayez le système “windows-1252”
  • si vous êtes sous Mac OS X : essayez le système “MacRoman”
    • les variantes régionales du système peuvent utiliser d'autres systèmes d'encodage, par exemple “MacCyrillic” ou “MacCentralEurope”
  • si vous êtes sous Ubuntu : essayez le système “UTF8”
  • si vous ne savez pas : essayez le système “UTF8”

Liste complète des systèmes d'encodage

Chaque nom de système d'encodage est suivi de ses appellations synonymes.

  1. Big5 = csBig5
  2. Big5-HKSCS = Big5_HKSCS, big5-hkscs, big5hkscs, big5hk
  3. EUC-JP = eucjis, Extended_UNIX_Code_Packed_Format_for_Japanese, x-eucjp, eucjp, csEUCPkdFmtjapanese, x-euc-jp, euc_jp
  4. EUC-KR = 5601, ksc5601-1987, ksc5601_1987, euckr, ksc5601, ksc_5601, ks_c_5601-1987, euc_kr, csEUCKR
  5. GB18030 = gb18030-2000
  6. GB2312 = euc-cn, x-EUC-CN, gb2312-1980, gb2312, gb2312-80, EUC_CN, euccn
  7. GBK = windows-936, CP936
  8. IBM-Thai = 838, cp838, ibm838, ibm-838
  9. IBM00858 = cp858, 858, ccsid00858, PC-Multilingual-850+euro, cp00858
  10. IBM01140 = 1140, cp01140, ccsid01140, cp1140, ebcdic-us-037+euro
  11. IBM01141 = cp1141, 1141, cp01141, ccsid01141, ebcdic-de-273+euro
  12. IBM01142 = cp01142, cp1142, ebcdic-no-277+euro, 1142, ebcdic-dk-277+euro, ccsid01142
  13. IBM01143 = ebcdic-se-278+euro, 1143, cp01143, ccsid01143, ebcdic-fi-278+euro, cp1143
  14. IBM01144 = cp01144, ebcdic-it-280+euro, 1144, ccsid01144, cp1144
  15. IBM01145 = ebcdic-es-284+euro, cp1145, cp01145, 1145, ccsid01145
  16. IBM01146 = ccsid01146, cp01146, ebcdic-gb-285+euro, 1146, cp1146
  17. IBM01147 = ccsid01147, ebcdic-fr-277+euro, cp1147, 1147, cp01147
  18. IBM01148 = cp1148, ebcdic-international-500+euro, 1148, ccsid01148, cp01148
  19. IBM01149 = ebcdic-s-871+euro, cp01149, cp1149, 1149, ccsid01149
  20. IBM037 = cs-ebcdic-cp-nl, cs-ebcdic-cp-us, ebcdic-cp-wt, 037, ebcdic-cp-ca, cs-ebcdic-cp-wt, ibm-037, csIBM037, cp037, cs-ebcdic-cp-ca, cpibm37, ibm037, ebcdic-cp-nl, ebcdic-cp-us, ibm-37
  21. IBM1026 = 1026, cp1026, ibm-1026, ibm1026
  22. IBM1047 = cp1047, 1047, ibm-1047
  23. IBM273 = ibm-273, ibm273, cp273, 273
  24. IBM277 = 277, cp277, ibm-277, ibm277
  25. IBM278 = csIBM278, ebcdic-cp-se, cp278, 278, ebcdic-sv, ibm278, ibm-278
  26. IBM280 = 280, ibm-280, ibm280, cp280
  27. IBM284 = cpibm284, csIBM284, ibm284, cp284, 284, ibm-284
  28. IBM285 = ibm285, ebcdic-cp-gb, cpibm285, cp285, csIBM285, ebcdic-gb, 285, ibm-285
  29. IBM290 = cp290, ibm-290, ibm290, EBCDIC-JP-kana, 290, csIBM290
  30. IBM297 = cp297, cpibm297, ibm297, ebcdic-cp-fr, 297, ibm-297, csIBM297
  31. IBM420 = ibm420, cp420, 420, ibm-420, csIBM420, ebcdic-cp-ar1
  32. IBM424 = csIBM424, ibm-424, ibm424, cp424, ebcdic-cp-he, 424
  33. IBM437 = ibm-437, windows-437, cspc8codepage437, 437, ibm437, cp437
  34. IBM500 = ibm-500, ebcdic-cp-bh, cp500, csIBM500, ibm500, ebcdic-cp-ch, 500
  35. IBM775 = ibm-775, 775, cp775, ibm775
  36. IBM850 = ibm-850, cp850, 850, cspc850multilingual, ibm850
  37. IBM852 = ibm852, csPCp852, 852, ibm-852, cp852
  38. IBM855 = cspcp855, 855, ibm855, ibm-855, cp855
  39. IBM857 = csIBM857, 857, ibm-857, cp857, ibm857
  40. IBM860 = 860, cp860, ibm-860, csIBM860, ibm860
  41. IBM861 = 861, cp-is, ibm-861, cp861, csIBM861, ibm861
  42. IBM862 = ibm-862, ibm862, csIBM862, cp862, cspc862latinhebrew, 862
  43. IBM863 = ibm863, csIBM863, cp863, 863, ibm-863
  44. IBM864 = csIBM864, ibm864, 864, cp864, ibm-864
  45. IBM865 = csIBM865, ibm865, 865, ibm-865, cp865
  46. IBM866 = 866, ibm-866, ibm866, csIBM866, cp866
  47. IBM868 = 868, ibm-868, cp868, csIBM868, cp-ar, ibm868
  48. IBM869 = 869, ibm-869, cp869, csIBM869, cp-gr, ibm869
  49. IBM870 = ibm-870, ebcdic-cp-roece, ebcdic-cp-yu, csIBM870, ibm870, cp870, 870
  50. IBM871 = ibm-871, 871, ebcdic-cp-is, cp871, csIBM871, ibm871
  51. IBM918 = ebcdic-cp-ar2, 918, ibm-918, cp918
  52. ISO-2022-CN = csISO2022CN, ISO2022CN
  53. ISO-2022-JP = jis_encoding, csjisencoding, jis, iso2022jp, csISO2022JP
  54. ISO-2022-JP-2 = csISO2022JP2, iso2022jp2
  55. ISO-2022-KR = csISO2022KR, ISO2022KR
  56. ISO-8859-1 = csISOLatin1, latin1, IBM-819, iso-ir-100, 8859_1, ISO_8859-1:1987, ISO_8859-1, 819, l1, ISO8859-1, IBM819, ISO_8859_1, ISO8859_1, cp819
  57. ISO-8859-13 = 8859_13, iso8859_13, iso_8859-13, ISO8859-13
  58. ISO-8859-15 = IBM923, 8859_15, ISO_8859-15, ISO-8859-15, L9, ISO8859-15, ISO8859_15_FDIS, 923, LATIN0, csISOlatin9, LATIN9, csISOlatin0, IBM-923, ISO8859_15, cp923
  59. ISO-8859-2 = csISOLatin2, iso-ir-101, ibm-912, 8859_2, l2, ISO_8859-2, ibm912, 912, ISO8859-2, latin2, iso8859_2, ISO_8859-2:1987, cp912
  60. ISO-8859-3 = ibm-913, latin3, csISOLatin3, iso-ir-109, l3, iso8859_3, ISO_8859-3:1988, 8859_3, ibm913, ISO8859-3, ISO_8859-3, 913, cp913
  61. ISO-8859-4 = iso-ir-110, iso8859-4, ibm914, ibm-914, csISOLatin4, l4, 914, 8859_4, latin4, ISO_8859-4, ISO_8859-4:1988, iso8859_4, cp914
  62. ISO-8859-5 = cp915, ISO8859-5, ibm915, ISO_8859-5:1988, ibm-915, 8859_5, 915, cyrillic, iso8859_5, ISO_8859-5, iso-ir-144, csISOLatinCyrillic
  63. ISO-8859-6 = arabic, ibm1089, iso8859_6, iso-ir-127, 8859_6, cp1089, ECMA-114, ISO_8859-6, csISOLatinArabic, 1089, ibm-1089, ISO8859-6, ASMO-708, ISO_8859-6:1987
  64. ISO-8859-7 = iso8859-7, sun_eu_greek, csISOLatinGreek, 813, ISO_8859-7, ibm-813, ISO_8859-7:1987, greek, greek8, iso8859_7, ECMA-118, iso-ir-126, 8859_7, cp813, ibm813, ELOT_928
  65. ISO-8859-8 = ibm916, cp916, csISOLatinHebrew, ISO_8859-8, ISO8859-8, ibm-916, iso8859_8, hebrew, 916, iso-ir-138, ISO_8859-8:1988, 8859_8
  66. ISO-8859-9 = ISO_8859-9, 920, iso8859_9, csISOLatin5, l5, 8859_9, latin5, ibm920, iso-ir-148, ISO_8859-9:1989, ISO8859-9, cp920, ibm-920
  67. JIS_X0201 = JIS0201, X0201, JIS_X0201, csHalfWidthKatakana
  68. JIS_X0212-1990 = csISO159JISX02121990, x0212, jis_x0212-1990, iso-ir-159, JIS0212
  69. KOI8-R = cskoi8r, koi8_r, koi8
  70. KOI8-U = koi8_u
  71. Shift_JIS = x-sjis, shift_jis, sjis, ms_kanji, shift-jis, csShiftJIS
  72. TIS-620 = tis620.2533, tis620
  73. US-ASCII = cp367, ascii7, ISO646-US, 646, csASCII, us, iso_646.irv:1983, ISO_646.irv:1991, IBM367, ASCII, default, ANSI_X3.4-1986, ANSI_X3.4-1968, iso-ir-6
  74. UTF-16 = utf16, UnicodeBig, UTF_16, unicode
  75. UTF-16BE = X-UTF-16BE, UTF_16BE, ISO-10646-UCS-2, UnicodeBigUnmarked
  76. UTF-16LE = UnicodeLittleUnmarked, UTF_16LE, X-UTF-16LE
  77. UTF-32 = UTF32, UTF_32
  78. UTF-32BE = X-UTF-32BE, UTF_32BE
  79. UTF-32LE = X-UTF-32LE, UTF_32LE
  80. UTF-8 = unicode-1-1-utf-8, UTF8
  81. windows-1250 = cp1250, cp5346
  82. windows-1251 = ansi-1251, cp5347, cp1251
  83. windows-1252 = cp1252, cp5348
  84. windows-1253 = cp5349, cp1253
  85. windows-1254 = cp5350, cp1254
  86. windows-1255 = cp1255
  87. windows-1256 = cp1256
  88. windows-1257 = cp1257, cp5353
  89. windows-1258 = cp1258
  90. windows-31j = csWindows31J, windows-932, MS932
  91. x-Big5-HKSCS-2001 = big5-hkscs:unicode3.0, big5-hkscs-2001, big5hk-2001, big5hkscs-2001, Big5_HKSCS_2001
  92. x-Big5-Solaris = Big5_Solaris
  93. x-COMPOUND_TEXT = x-compound-text, COMPOUND_TEXT, x11-compound_text
  94. x-euc-jp-linux = euc_jp_linux, euc-jp-linux
  95. x-EUC-TW = euctw, euc_tw, EUC-TW, cns11643
  96. x-eucJP-Open = eucJP-open, EUC_JP_Solaris
  97. x-IBM1006 = ibm-1006, cp1006, ibm1006, 1006
  98. x-IBM1025 = ibm-1025, cp1025, 1025, ibm1025
  99. x-IBM1046 = ibm-1046, ibm1046, cp1046, 1046
  100. x-IBM1097 = 1097, cp1097, ibm-1097, ibm1097
  101. x-IBM1098 = ibm-1098, ibm1098, cp1098, 1098
  102. x-IBM1112 = ibm-1112, 1112, ibm1112, cp1112
  103. x-IBM1122 = 1122, cp1122, ibm-1122, ibm1122
  104. x-IBM1123 = ibm-1123, ibm1123, cp1123, 1123
  105. x-IBM1124 = 1124, cp1124, ibm-1124, ibm1124
  106. x-IBM1364 = 1364, cp1364, ibm1364, ibm-1364
  107. x-IBM1381 = ibm-1381, ibm1381, cp1381, 1381
  108. x-IBM1383 = cp1383, 1383, ibm-1383, ibm1383
  109. x-IBM300 = ibm300, 300, cp300, ibm-300
  110. x-IBM33722 = ibm33722, 33722, ibm-33722_vascii_vpua, ibm-5050, ibm-33722, cp33722
  111. x-IBM737 = cp737, ibm-737, 737, ibm737
  112. x-IBM833 = ibm-833, ibm833, cp833
  113. x-IBM834 = 834, ibm834, ibm-834, cp834
  114. x-IBM856 = 856, cp856, ibm-856, ibm856
  115. x-IBM874 = 874, cp874, ibm874, ibm-874
  116. x-IBM875 = 875, ibm875, cp875, ibm-875
  117. x-IBM921 = cp921, ibm921, 921, ibm-921
  118. x-IBM922 = ibm922, ibm-922, 922, cp922
  119. x-IBM930 = cp930, ibm930, 930, ibm-930
  120. x-IBM933 = 933, cp933, ibm933, ibm-933
  121. x-IBM935 = ibm935, 935, cp935, ibm-935
  122. x-IBM937 = ibm-937, cp937, 937, ibm937
  123. x-IBM939 = ibm-939, ibm939, cp939, 939
  124. x-IBM942 = ibm-942, ibm942, 942, cp942
  125. x-IBM942C = 942C, ibm942C, ibm-942C, cp942C
  126. x-IBM943 = ibm943, cp943, 943, ibm-943
  127. x-IBM943C = ibm-943C, 943C, cp943C, ibm943C
  128. x-IBM948 = ibm948, ibm-948, cp948, 948
  129. x-IBM949 = 949, ibm-949, ibm949, cp949
  130. x-IBM949C = ibm949C, cp949C, 949C, ibm-949C
  131. x-IBM950 = 950, ibm950, cp950, ibm-950
  132. x-IBM964 = 964, ibm-964, cp964, ibm964
  133. x-IBM970 = 970, ibm-970, ibm970, cp970, ibm-eucKR
  134. x-ISCII91 = iso-ir-153, ST_SEV_358-88, ISCII91, iscii, csISO153GOST1976874
  135. x-ISO-2022-CN-CNS = ISO-2022-CN-CNS, ISO2022CN_CNS
  136. x-ISO-2022-CN-GB = ISO-2022-CN-GB, ISO2022CN_GB
  137. x-iso-8859-11 = iso-8859-11, iso8859_11
  138. x-JIS0208 = JIS_X0208-1983, x0208, JIS0208, JIS_C6226-1983, iso-ir-87, csISO87JISX0208
  139. x-JISAutoDetect = JISAutoDetect
  140. x-Johab = ksc5601_1992, ms1361, johab, ksc5601-1992
  141. x-MacArabic = MacArabic
  142. x-MacCentralEurope = MacCentralEurope
  143. x-MacCroatian = MacCroatian
  144. x-MacCyrillic = MacCyrillic
  145. x-MacDingbat = MacDingbat
  146. x-MacGreek = MacGreek
  147. x-MacHebrew = MacHebrew
  148. x-MacIceland = MacIceland
  149. x-MacRoman = MacRoman
  150. x-MacRomania = MacRomania
  151. x-MacSymbol = MacSymbol
  152. x-MacThai = MacThai
  153. x-MacTurkish = MacTurkish
  154. x-MacUkraine = MacUkraine
  155. x-MS932_0213 = (aucun synonyme)
  156. x-MS950-HKSCS = MS950_HKSCS
  157. x-MS950-HKSCS-XP = MS950_HKSCS_XP
  158. x-mswin-936 = ms936, ms_936
  159. x-PCK = pck
  160. x-SJIS_0213 = (aucun synonyme)
  161. x-UTF-16LE-BOM = UnicodeLittle
  162. X-UTF-32BE-BOM = UTF-32BE-BOM, UTF_32BE_BOM
  163. X-UTF-32LE-BOM = UTF_32LE_BOM, UTF-32LE-BOM
  164. x-windows-50220 = ms50220, cp50220
  165. x-windows-50221 = cp50221, ms50221
  166. x-windows-874 = ms-874, ms874, windows-874
  167. x-windows-949 = ms_949, windows-949, windows949, ms949
  168. x-windows-950 = ms950, windows-950
  169. x-windows-iso2022jp = windows-iso2022jp
public/character_encodings_list.txt · Dernière modification: 2018/06/21 16:14 par slh@ens-lyon.fr