builder/lib/processors/nonAsciiEscaper.js

  1. import escapeUnicode from "escape-unicode";
  2. /**
  3. * @public
  4. * @module @ui5/builder/processors/nonAsciiEscaper
  5. */
  6. /**
  7. * @see https://en.wikipedia.org/wiki/ASCII
  8. * ascii contains 128 characters.
  9. * its char codes reach from 0 to 127.
  10. * @type {number}
  11. */
  12. const CHAR_CODE_OF_LAST_ASCII_CHARACTER = 127;
  13. // use memoization for escapeUnicode function for performance
  14. const memoizeEscapeUnicodeMap = Object.create(null);
  15. const memoizeEscapeUnicode = function(sChar) {
  16. if (memoizeEscapeUnicodeMap[sChar]) {
  17. return memoizeEscapeUnicodeMap[sChar];
  18. }
  19. memoizeEscapeUnicodeMap[sChar] = escapeUnicode(sChar);
  20. return memoizeEscapeUnicodeMap[sChar];
  21. };
  22. /**
  23. * Escapes non ASCII characters with unicode escape sequences.
  24. *
  25. * @see https://en.wikipedia.org/wiki/ASCII
  26. * @see https://tools.ietf.org/html/rfc5137#section-6.1
  27. *
  28. *
  29. * @param {string} string input string with non ascii characters, e.g. L♥VE
  30. * @returns {{string: (string), modified: boolean}} output string with all non ascii
  31. * characters being escaped by unicode sequence, e.g. L\u2665VE
  32. */
  33. const escapeNonAscii = function(string) {
  34. let result = "";
  35. let modified = false;
  36. for (let i = 0; i < string.length; i++) {
  37. const char = string[i];
  38. // check for non ascii characters (characters which have a char code
  39. // greater than the ascii character code range)
  40. if (string.charCodeAt(i) > CHAR_CODE_OF_LAST_ASCII_CHARACTER) {
  41. result += memoizeEscapeUnicode(char);
  42. modified = true;
  43. } else {
  44. result += char;
  45. }
  46. }
  47. return {
  48. modified,
  49. string: result
  50. };
  51. };
  52. /**
  53. * Escapes non ASCII characters with unicode escape sequences.
  54. *
  55. * @example
  56. * const encoding = nonAsciiEscaper.getEncodingFromAlias("ISO-8859-1");
  57. * nonAsciiEscaper({resources, options: {encoding}});
  58. *
  59. *
  60. * @public
  61. * @function default
  62. * @static
  63. *
  64. * @param {object} parameters Parameters
  65. * @param {@ui5/fs/Resource[]} parameters.resources List of resources to be processed
  66. * @param {object} [parameters.options] Options
  67. * @param {string} [parameters.options.encoding="utf8"] resource file encoding
  68. * ({@link https://nodejs.org/api/buffer.html#buffer_buffers_and_character_encodings Node.js character encodings}).
  69. * Use #getEncodingFromAlias to get the encoding string
  70. * @returns {Promise<@ui5/fs/Resource[]>} Promise resolving with the processed resources
  71. */
  72. async function nonAsciiEscaper({resources, options: {encoding}}) {
  73. encoding = encoding || "utf8";
  74. async function processResource(resource) {
  75. const resourceString = (await resource.getBuffer()).toString(encoding);
  76. const escaped = escapeNonAscii(resourceString);
  77. // only modify the resource's string if it was changed
  78. if (escaped.modified) {
  79. resource.setString(escaped.string);
  80. }
  81. return resource;
  82. }
  83. return Promise.all(resources.map(processResource));
  84. }
  85. const encodingMap = {
  86. "UTF-8": "utf8",
  87. "ISO-8859-1": "latin1",
  88. };
  89. /**
  90. * Provides a mapping from user-friendly encoding name (alias) such as "UTF-8" and "ISO-8859-1" to node
  91. * specific encoding name such as "utf8" or "latin1". Simplifies usage of nonAsciiEscaper encoding option
  92. * such that it can be used standalone without the respective task (e.g. in Splitter, Bundler and related projects).
  93. *
  94. * @public
  95. * @function getEncodingFromAlias
  96. * @alias @ui5/builder/processors/nonAsciiEscaper․getEncodingFromAlias
  97. * @static
  98. *
  99. * @param {string} encoding encoding labels: "UTF-8" and "ISO-8859-1"
  100. * @returns {string} node.js character encoding string, e.g. utf8 and latin1
  101. */
  102. nonAsciiEscaper.getEncodingFromAlias = function(encoding) {
  103. if (!encodingMap[encoding]) {
  104. throw new Error(
  105. `Encoding "${encoding}" is not supported. Only ${Object.keys(encodingMap).join(", ")} are allowed values` );
  106. }
  107. return encodingMap[encoding];
  108. };
  109. export default nonAsciiEscaper;