From: Jesse Tane Date: Sun, 5 Jan 2014 22:39:42 +0000 (-0500) Subject: detect and handle utf16 non-BMP characters (surrogate pairs) X-Git-Url: https://zoso.dev/?a=commitdiff_plain;h=f812fb66863ba4ec977331ca7538f8fa9a3f3f54;p=buffer.git detect and handle utf16 non-BMP characters (surrogate pairs) --- diff --git a/index.js b/index.js index f8ce472..c77d54a 100644 --- a/index.js +++ b/index.js @@ -920,14 +920,18 @@ function toHex (n) { function utf8ToBytes (str) { var byteArray = [] - for (var i = 0; i < str.length; i++) - if (str.charCodeAt(i) <= 0x7F) + for (var i = 0; i < str.length; i++) { + var b = str.charCodeAt(i) + if (b <= 0x7F) byteArray.push(str.charCodeAt(i)) else { - var h = encodeURIComponent(str.charAt(i)).substr(1).split('%') + var start = i + if (b >= 0xD800 && b <= 0xDFFF) i++ + var h = encodeURIComponent(str.slice(start, i+1)).substr(1).split('%') for (var j = 0; j < h.length; j++) byteArray.push(parseInt(h[j], 16)) } + } return byteArray }