You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							431 lines
						
					
					
						
							13 KiB
						
					
					
				
			
		
		
		
			
			
			
				
					
				
				
					
				
			
		
		
	
	
							431 lines
						
					
					
						
							13 KiB
						
					
					
				| "use strict"; | |
| Object.defineProperty(exports, "__esModule", { value: true }); | |
| /** | |
|  * @param {boolean} fatal If true, decoding errors raise an exception. | |
|  * @param {number=} opt_code_point Override the standard fallback code point. | |
|  * @return {number} The code point to insert on a decoding error. | |
|  */ | |
| function decoderError(fatal, opt_code_point) { | |
|     if (opt_code_point === void 0) { opt_code_point = undefined; } | |
|     if (fatal) | |
|         throw TypeError("Decoder error"); | |
|     return opt_code_point || 0xfffd; | |
| } | |
| exports.decoderError = decoderError; | |
| /** | |
|  * @param {number} code_point The code point that could not be encoded. | |
|  * @return {number} Always throws, no value is actually returned. | |
|  */ | |
| function encoderError(code_point) { | |
|     throw TypeError("The code point " + code_point + " could not be encoded."); | |
| } | |
| exports.encoderError = encoderError; | |
| // 5.2 Names and labels | |
| // TODO: Define @typedef for Encoding: {name:string,labels:Array.<string>} | |
| // https://github.com/google/closure-compiler/issues/247 | |
| /** | |
|  * @param {string} label The encoding label. | |
|  * @return {?{name:string,labels:Array.<string>}} | |
|  */ | |
| function getEncoding(label) { | |
|     // 1. Remove any leading and trailing ASCII whitespace from label. | |
|     var keyLabel = String(label).trim().toLowerCase(); | |
|     // 2. If label is an ASCII case-insensitive match for any of the | |
|     // labels listed in the table below, return the corresponding | |
|     // encoding, and failure otherwise. | |
|     if (keyLabel in label_to_encoding) { | |
|         return label_to_encoding[keyLabel]; | |
|     } | |
|     return null; | |
| } | |
| exports.getEncoding = getEncoding; | |
| /** | |
|  * Encodings table: https://encoding.spec.whatwg.org/encodings.json | |
|  * @const | |
|  * @type {!Array.<{ | |
|  *          heading: string, | |
|  *          encodings: Array.<{name:string,labels:Array.<string>}> | |
|  *        }>} | |
|  */ | |
| var encodings = [ | |
|     { | |
|         encodings: [ | |
|             { | |
|                 labels: ["unicode-1-1-utf-8", "utf-8", "utf8"], | |
|                 name: "UTF-8", | |
|             }, | |
|         ], | |
|         heading: "The Encoding", | |
|     }, | |
|     { | |
|         encodings: [ | |
|             { | |
|                 labels: ["866", "cp866", "csibm866", "ibm866"], | |
|                 name: "IBM866", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csisolatin2", | |
|                     "iso-8859-2", | |
|                     "iso-ir-101", | |
|                     "iso8859-2", | |
|                     "iso88592", | |
|                     "iso_8859-2", | |
|                     "iso_8859-2:1987", | |
|                     "l2", | |
|                     "latin2", | |
|                 ], | |
|                 name: "ISO-8859-2", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csisolatin3", | |
|                     "iso-8859-3", | |
|                     "iso-ir-109", | |
|                     "iso8859-3", | |
|                     "iso88593", | |
|                     "iso_8859-3", | |
|                     "iso_8859-3:1988", | |
|                     "l3", | |
|                     "latin3", | |
|                 ], | |
|                 name: "ISO-8859-3", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csisolatin4", | |
|                     "iso-8859-4", | |
|                     "iso-ir-110", | |
|                     "iso8859-4", | |
|                     "iso88594", | |
|                     "iso_8859-4", | |
|                     "iso_8859-4:1988", | |
|                     "l4", | |
|                     "latin4", | |
|                 ], | |
|                 name: "ISO-8859-4", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csisolatincyrillic", | |
|                     "cyrillic", | |
|                     "iso-8859-5", | |
|                     "iso-ir-144", | |
|                     "iso8859-5", | |
|                     "iso88595", | |
|                     "iso_8859-5", | |
|                     "iso_8859-5:1988", | |
|                 ], | |
|                 name: "ISO-8859-5", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "arabic", | |
|                     "asmo-708", | |
|                     "csiso88596e", | |
|                     "csiso88596i", | |
|                     "csisolatinarabic", | |
|                     "ecma-114", | |
|                     "iso-8859-6", | |
|                     "iso-8859-6-e", | |
|                     "iso-8859-6-i", | |
|                     "iso-ir-127", | |
|                     "iso8859-6", | |
|                     "iso88596", | |
|                     "iso_8859-6", | |
|                     "iso_8859-6:1987", | |
|                 ], | |
|                 name: "ISO-8859-6", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csisolatingreek", | |
|                     "ecma-118", | |
|                     "elot_928", | |
|                     "greek", | |
|                     "greek8", | |
|                     "iso-8859-7", | |
|                     "iso-ir-126", | |
|                     "iso8859-7", | |
|                     "iso88597", | |
|                     "iso_8859-7", | |
|                     "iso_8859-7:1987", | |
|                     "sun_eu_greek", | |
|                 ], | |
|                 name: "ISO-8859-7", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csiso88598e", | |
|                     "csisolatinhebrew", | |
|                     "hebrew", | |
|                     "iso-8859-8", | |
|                     "iso-8859-8-e", | |
|                     "iso-ir-138", | |
|                     "iso8859-8", | |
|                     "iso88598", | |
|                     "iso_8859-8", | |
|                     "iso_8859-8:1988", | |
|                     "visual", | |
|                 ], | |
|                 name: "ISO-8859-8", | |
|             }, | |
|             { | |
|                 labels: ["csiso88598i", "iso-8859-8-i", "logical"], | |
|                 name: "ISO-8859-8-I", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csisolatin6", | |
|                     "iso-8859-10", | |
|                     "iso-ir-157", | |
|                     "iso8859-10", | |
|                     "iso885910", | |
|                     "l6", | |
|                     "latin6", | |
|                 ], | |
|                 name: "ISO-8859-10", | |
|             }, | |
|             { | |
|                 labels: ["iso-8859-13", "iso8859-13", "iso885913"], | |
|                 name: "ISO-8859-13", | |
|             }, | |
|             { | |
|                 labels: ["iso-8859-14", "iso8859-14", "iso885914"], | |
|                 name: "ISO-8859-14", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csisolatin9", | |
|                     "iso-8859-15", | |
|                     "iso8859-15", | |
|                     "iso885915", | |
|                     "iso_8859-15", | |
|                     "l9", | |
|                 ], | |
|                 name: "ISO-8859-15", | |
|             }, | |
|             { | |
|                 labels: ["iso-8859-16"], | |
|                 name: "ISO-8859-16", | |
|             }, | |
|             { | |
|                 labels: ["cskoi8r", "koi", "koi8", "koi8-r", "koi8_r"], | |
|                 name: "KOI8-R", | |
|             }, | |
|             { | |
|                 labels: ["koi8-ru", "koi8-u"], | |
|                 name: "KOI8-U", | |
|             }, | |
|             { | |
|                 labels: ["csmacintosh", "mac", "macintosh", "x-mac-roman"], | |
|                 name: "macintosh", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "dos-874", | |
|                     "iso-8859-11", | |
|                     "iso8859-11", | |
|                     "iso885911", | |
|                     "tis-620", | |
|                     "windows-874", | |
|                 ], | |
|                 name: "windows-874", | |
|             }, | |
|             { | |
|                 labels: ["cp1250", "windows-1250", "x-cp1250"], | |
|                 name: "windows-1250", | |
|             }, | |
|             { | |
|                 labels: ["cp1251", "windows-1251", "x-cp1251"], | |
|                 name: "windows-1251", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "ansi_x3.4-1968", | |
|                     "cp1252", | |
|                     "cp819", | |
|                     "ibm819", | |
|                     "iso-ir-100", | |
|                     "windows-1252", | |
|                     "x-cp1252", | |
|                 ], | |
|                 name: "windows-1252", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "ascii", | |
|                     "us-ascii", | |
|                     "iso-8859-1", | |
|                     "iso8859-1", | |
|                     "iso88591", | |
|                     "iso_8859-1", | |
|                     "iso_8859-1:1987", | |
|                     "l1", | |
|                     "latin1", | |
|                     "csisolatin1", | |
|                 ], | |
|                 name: "iso-8859-1", | |
|             }, | |
|             { | |
|                 labels: ["cp1253", "windows-1253", "x-cp1253"], | |
|                 name: "windows-1253", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "cp1254", | |
|                     "csisolatin5", | |
|                     "iso-8859-9", | |
|                     "iso-ir-148", | |
|                     "iso8859-9", | |
|                     "iso88599", | |
|                     "iso_8859-9", | |
|                     "iso_8859-9:1989", | |
|                     "l5", | |
|                     "latin5", | |
|                     "windows-1254", | |
|                     "x-cp1254", | |
|                 ], | |
|                 name: "windows-1254", | |
|             }, | |
|             { | |
|                 labels: ["cp1255", "windows-1255", "x-cp1255"], | |
|                 name: "windows-1255", | |
|             }, | |
|             { | |
|                 labels: ["cp1256", "windows-1256", "x-cp1256"], | |
|                 name: "windows-1256", | |
|             }, | |
|             { | |
|                 labels: ["cp1257", "windows-1257", "x-cp1257"], | |
|                 name: "windows-1257", | |
|             }, | |
|             { | |
|                 labels: ["cp1258", "windows-1258", "x-cp1258"], | |
|                 name: "windows-1258", | |
|             }, | |
|             { | |
|                 labels: ["x-mac-cyrillic", "x-mac-ukrainian"], | |
|                 name: "x-mac-cyrillic", | |
|             }, | |
|         ], | |
|         heading: "Legacy single-byte encodings", | |
|     }, | |
|     { | |
|         encodings: [ | |
|             { | |
|                 labels: [ | |
|                     "chinese", | |
|                     "csgb2312", | |
|                     "csiso58gb231280", | |
|                     "gb2312", | |
|                     "gb_2312", | |
|                     "gb_2312-80", | |
|                     "gbk", | |
|                     "iso-ir-58", | |
|                     "x-gbk", | |
|                 ], | |
|                 name: "GBK", | |
|             }, | |
|             { | |
|                 labels: ["gb18030"], | |
|                 name: "gb18030", | |
|             }, | |
|         ], | |
|         heading: "Legacy multi-byte Chinese (simplified) encodings", | |
|     }, | |
|     { | |
|         encodings: [ | |
|             { | |
|                 labels: ["big5", "big5-hkscs", "cn-big5", "csbig5", "x-x-big5"], | |
|                 name: "Big5", | |
|             }, | |
|         ], | |
|         heading: "Legacy multi-byte Chinese (traditional) encodings", | |
|     }, | |
|     { | |
|         encodings: [ | |
|             { | |
|                 labels: ["cseucpkdfmtjapanese", "euc-jp", "x-euc-jp"], | |
|                 name: "EUC-JP", | |
|             }, | |
|             { | |
|                 labels: ["csiso2022jp", "iso-2022-jp"], | |
|                 name: "ISO-2022-JP", | |
|             }, | |
|             { | |
|                 labels: [ | |
|                     "csshiftjis", | |
|                     "ms932", | |
|                     "ms_kanji", | |
|                     "shift-jis", | |
|                     "shift_jis", | |
|                     "sjis", | |
|                     "windows-31j", | |
|                     "x-sjis", | |
|                 ], | |
|                 name: "Shift_JIS", | |
|             }, | |
|         ], | |
|         heading: "Legacy multi-byte Japanese encodings", | |
|     }, | |
|     { | |
|         encodings: [ | |
|             { | |
|                 labels: [ | |
|                     "cseuckr", | |
|                     "csksc56011987", | |
|                     "euc-kr", | |
|                     "iso-ir-149", | |
|                     "korean", | |
|                     "ks_c_5601-1987", | |
|                     "ks_c_5601-1989", | |
|                     "ksc5601", | |
|                     "ksc_5601", | |
|                     "windows-949", | |
|                 ], | |
|                 name: "EUC-KR", | |
|             }, | |
|         ], | |
|         heading: "Legacy multi-byte Korean encodings", | |
|     }, | |
|     { | |
|         encodings: [ | |
|             { | |
|                 labels: [ | |
|                     "csiso2022kr", | |
|                     "hz-gb-2312", | |
|                     "iso-2022-cn", | |
|                     "iso-2022-cn-ext", | |
|                     "iso-2022-kr", | |
|                 ], | |
|                 name: "replacement", | |
|             }, | |
|             { | |
|                 labels: ["utf-16be"], | |
|                 name: "UTF-16BE", | |
|             }, | |
|             { | |
|                 labels: ["utf-16", "utf-16le"], | |
|                 name: "UTF-16LE", | |
|             }, | |
|             { | |
|                 labels: ["x-user-defined"], | |
|                 name: "x-user-defined", | |
|             }, | |
|         ], | |
|         heading: "Legacy miscellaneous encodings", | |
|     }, | |
| ]; | |
| exports.encodings = encodings; | |
| // Label to encoding registry. | |
| /** @type {Object.<string,{name:string,labels:Array.<string>}>} */ | |
| var label_to_encoding = {}; | |
| encodings.forEach(function (category) { | |
|     category.encodings.forEach(function (encoding) { | |
|         encoding.labels.forEach(function (label) { | |
|             label_to_encoding[label] = encoding; | |
|         }); | |
|     }); | |
| }); | |
| //# sourceMappingURL=encodings.js.map
 |