Zum Verhältnis zwischen Unicode und UTF kann man sich einfach merken: Unicode ist ein Codierungsstandard (eine Codierungsspezifikation); in Java ist mit „Unicode“ konkret UTF-16 gemeint. Ein gutes Beispiel aus dem Netz:
Der Code lautet wie folgt:
public static void main (String [] args) wirft eine nicht unterstützte AnscodingException aus {
Stringutil.str2all ("0 Produktmodellbeschreibung");
Stringutil.str4all ("30000900A74ec1548b57f753cf63f08f");
}
/**
* Versuchen Sie, hexadezimale numerische Zeichenfolgen in allen Codierungsformaten zu codieren
*
* @param hexstr
* @Throws Uns SupportedenCodingException
*/
public static void str4all (String uSTR) wirft eine nicht unterstützte AnscodingException aus {
System.out.println ("++++++++++++++++++++++++++++++++++++++ +++++++++++++++++++++++++++++++ -);
byte [] bs = new byte [uststr.length ()/2];
für (int i = 0; i <bs.Length; i ++) {
BS [i] = (Byte) Integer
}
System.out.println (neue String (BS, "UTF-8");
// 16
System.out.println (neue String (BS, "UTF-16");
System.out.println (neue String (BS, "UTF-16LE");
System.out.println (neue String (BS, "X-UTF-16LE-BOM");
System.out.println (neue String (BS, "UTF-16BE");
//System.out.println(new String (BS, "X-UTF-16BE-BOM");
// 32
System.out.println (neue String (BS, "UTF-32");
System.out.println (neue String (BS, "UTF-32LE");
System.out.println (neue String (BS, "X-UTF-32LE-BOM");
System.out.println (neue String (BS, "UTF-32BE");
System.out.println (neue String (BS, "X-UTF-32LE-BOM");
}
/**
* Listen Sie alle dekodierten hexadezimalen numerischen Zeichenfolgen auf, die der Codierung entsprechen
*
* @param uStr
* @Throws Uns SupportedenCodingException
*/
public static void Str2all (String uSTR) wirft eine nicht unterstützte AnscodingException aus {
System.out.println ("++++++++++++++++++++++++++++++++++++++ +++++++++++++++++++++++++++++++ -);
byte [] bs = new Byte [] {};
bs = uststr.getBytes ("utf-8");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
// 16
bs = uststr.getBytes ("utf-16");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
bs = uststr.getBytes ("utf-16le");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
bs = uststr.getBytes ("X-UTF-16LE-BOM");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
bs = uststr.getBytes ("utf-16be");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
// bs = usstr.getBytes ("X-UTF-16BE-BOM");
// 32
bs = uststr.getBytes ("utf-32");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
bs = uststr.getBytes ("utf-32le");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
bs = uststr.getBytes ("X-UTF-32LE-BOM");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
bs = uststr.getBytes ("utf-32be");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
bs = uststr.getBytes ("X-UTF-32LE-BOM");
für (Byte B: bs) {
System.out.print (Integer.tohexString (B & 0xff));
}
System.out.println ();
}
Sammlung der Codierungsnamen (Charset-Namen und ihre Aliase)
Die Liste lautet wie folgt:
charset US-ASCII %s
HistoricalName ASCII
# Iana Aliase
Alias ISO-IR-6
alias ansi_x3.4-1986
alias iso_646.irv:1991
alias ascii
alias iso646-us
alias us
Alias IBM367
Alias CP367
alias csascii
alias default
# Andere Aliase
alias 646 # Solaris-POSIX-Gebietsschema
alias iso_646.irv:1983
alias ANSI_X3.4-1968 # Linux-POSIX-Gebietsschema (RedHat)
alias ascii7
Charset UTF-8 UTF_8
HistoricalName UTF8
alias utf8
Alias Unicode-1-1-UTF-8
Charset UTF-16 UTF_16
HistoricalName UTF-16
alias utf_16
alias utf16
alias unicode
alias unicodebig
Charset UTF-16BE UTF_16BE
HistoricalName Unicodebigunmarked
alias utf_16be
Alias ISO-10646-UCS-2
Alias X-UTF-16BE
alias unicodebigunmarked
Charset UTF-16LE UTF_16LE
HistoricalName Unicodelittleunmarked
alias utf_16le
Alias X-UTF-16LE
alias unicodelittleunmarked
Charset X-UTF-16LE-BOM UTF_16LE_BOM
HistoricalName Unicodelittle
alias unicodelittle
Charset UTF-32 UTF_32
alias utf_32
alias utf32
Charset UTF-32LE UTF_32LE
alias utf_32le
Alias X-UTF-32LE
charset UTF-32BE UTF_32BE
alias utf_32be
Alias X-UTF-32BE
charset X-UTF-32LE-BOM UTF_32LE_BOM
alias utf_32le_bom
Alias UTF-32LE-BOM
charset X-UTF-32BE-BOM UTF_32BE_BOM
alias utf_32be_bom
Alias UTF-32BE-BOM
Charset ISO-8859-1 %s
HistoricalName ISO8859_1
# Iana Aliase
Alias ISO-IR-100
alias iso_8859-1
alias latin1
Alias L1
Alias IBM819
alias cp819
alias csISOLatin1
# Andere Aliase
Alias 819
Alias IBM-819
Alias ISO8859_1
alias ISO_8859-1:1987
alias iso_8859_1
Alias 8859_1
Alias ISO8859-1
Charset ISO-8859-2 %s
HistoricalName ISO8859_2
Alias ISO8859_2
Alias 8859_2
Alias ISO-IR-101
alias iso_8859-2
alias ISO_8859-2:1987
Alias ISO8859-2
alias latin2
Alias L2
Alias IBM912
Alias IBM-912
alias cp912
Alias 912
alias csISOLatin2
Charset ISO-8859-4 %s
HistoricalName ISO8859_4
Alias ISO8859_4
Alias ISO8859-4
Alias 8859_4
Alias ISO-IR-110
alias iso_8859-4
alias ISO_8859-4:1988
alias latin4
Alias L4
Alias IBM914
Alias IBM-914
alias cp914
Alias 914
alias csISOLatin4
Charset ISO-8859-5 %s
HistoricalName ISO8859_5
Alias ISO8859_5
Alias 8859_5
Alias ISO-IR-144
alias iso_8859-5
alias ISO_8859-5:1988
Alias ISO8859-5
Alias Cyrillic
Alias IBM915
Alias IBM-915
alias cp915
Alias 915
alias csISOLatinCyrillic
Charset ISO-8859-7 %s
HistoricalName ISO8859_7
Alias ISO8859_7
Alias 8859_7
Alias ISO-IR-126
alias iso_8859-7
alias ISO_8859-7:1987
alias elot_928
alias ecma-118
alias greek
Alias Greek8
alias csisolatingreek
alias sun_eu_greek # Solaris 7/8 Kompatibilität
Alias IBM813
Alias IBM-813
Alias 813
alias cp813
Alias ISO8859-7 # Solaris 9 Kompatibilität
Charset ISO-8859-9 %s
HistoricalName ISO8859_9
Alias ISO8859_9
Alias 8859_9
Alias ISO-IR-148
alias iso_8859-9
alias ISO_8859-9:1989
Alias ISO8859-9
alias latin5
Alias L5
Alias IBM920
Alias IBM-920
Alias 920
alias cp920
alias csISOLatin5
Charset ISO-8859-13 %s
HistoricalName ISO8859_13
Alias ISO8859_13
Alias 8859_13
alias iso_8859-13
Alias ISO8859-13
Charset ISO-8859-15 %s
HistoricalName ISO8859_15
# Iana alias
alias iso_8859-15
# Andere Aliase
Alias 8859_15
Alias ISO8859_15
Alias ISO8859-15
Alias IBM923
Alias IBM-923
alias cp923
Alias 923
alias latin0
alias latin9
alias L9
alias csISOlatin0
alias csISOlatin9
alias iso8859_15_fdis
Charset KOI8-R %s
HistoricalName KOI8_R
alias koi8_r
alias koi8
alias cskoi8r
Charset KOI8-U %s
alias koi8_u
Charset Windows-1250 %s
HistoricalName CP1250
alias cp1250
alias cp5346 # euro ibm ccsid
Charset Windows-1251 %s
HistoricalName CP1251
alias cp1251
Alias CP5347 # Euro IBM CCSID
Alias ANSI-1251 # Solaris-Kompatibilität
Charset Windows-1252 %s
HistoricalName CP1252
alias cp1252
Alias CP5348 # Euro IBM CCSID
Charset Windows-1253 %s
HistoricalName CP1253
alias cp1253
Alias CP5349 # Euro IBM CCSID
Charset Windows-1254 %s
HistoricalName CP1254
alias cp1254
Alias CP5350 # Euro IBM CCSID
Charset Windows-1257 %s
HistoricalName CP1257
alias cp1257
Alias CP5353 # Euro IBM CCSID
Charset IBM437 %s
HistoricalName CP437
alias cp437
Alias IBM-437
Alias 437
alias cspc8codepage437
Alias Windows-437
Charset X-IBM737 %s
HistoricalName CP737
alias cp737
Alias IBM737
Alias IBM-737
Alias 737
Charset IBM775 %s
HistoricalName CP775
alias cp775
Alias IBM-775
Alias 775
Charset IBM850 %s
HistoricalName CP850
alias cp850
Alias IBM-850
Alias 850
alias csPC850Multilingual
Charset IBM852 %s
HistoricalName CP852
alias cp852
Alias IBM-852
Alias 852
alias cspcp852
Charset IBM855 %s
HistoricalName CP855
alias cp855
Alias IBM-855
Alias 855
alias cspcp855
Charset IBM857 %s
HistoricalName CP857
alias cp857
Alias IBM-857
Alias 857
alias csibm857
Charset IBM00858 %s
HistoricalName CP858
alias cp858
alias ccsid00858
alias cp00858
Alias 858
Charset IBM862 %s
HistoricalName CP862
alias cp862
Alias IBM-862
Alias 862
alias csibm862
alias cspc862latinHebrew
Charset IBM866 %s
HistoricalName CP866
alias cp866
Alias IBM-866
Alias 866
alias csibm866
Charset X-IBM874 %s
HistoricalName CP874
alias cp874
Alias IBM874
Alias IBM-874
Alias 874