|
| 1 | +import { utf8CountUint16Array } from "./utf8CountUint16Array"; |
| 2 | +import { storeUint8BE, storeUint16BE, storeUint32BE, loadUint16BE } from "./be"; |
| 3 | + |
// Writes the MessagePack string header for a payload of `utf8ByteLength`
// bytes starting at `outputPtr`, and returns the address immediately after
// the header (i.e. where the string payload should begin).
//
// The first format whose limit is above the length is chosen:
//   fixstr : length < 32       -> 1 byte  (0xa0 + length)
//   str 8  : length < 0x100    -> 0xd9 followed by a 1-byte length
//   str 16 : length < 0x10000  -> 0xda followed by a 2-byte length
//   str 32 : length < 2^32     -> 0xdb followed by a 4-byte length
// Anything larger throws an Error.
function storeStringHeader(outputPtr: usize, utf8ByteLength: usize): usize {
  // Address of the byte right after the leading marker byte.
  const afterMarker = outputPtr + 1;

  if (utf8ByteLength < 32) {
    // fixstr: marker and length share a single byte
    storeUint8BE(outputPtr, 0xa0 + (utf8ByteLength as u8));
    return afterMarker;
  }

  if (utf8ByteLength < 0x100) {
    // str 8
    storeUint8BE(outputPtr, 0xd9);
    storeUint8BE(afterMarker, utf8ByteLength as u8);
    return afterMarker + 1;
  }

  if (utf8ByteLength < 0x10000) {
    // str 16
    storeUint8BE(outputPtr, 0xda);
    storeUint16BE(afterMarker, utf8ByteLength as u16);
    return afterMarker + sizeof<u16>();
  }

  // Widen before comparing so the 2^32 limit is representable regardless of
  // how wide usize is.
  if ((utf8ByteLength as u64) < 0x100000000) {
    // str 32
    storeUint8BE(outputPtr, 0xdb);
    storeUint32BE(afterMarker, utf8ByteLength as u32);
    return afterMarker + sizeof<u32>();
  }

  throw new Error(`Too long string: ${utf8ByteLength} bytes in UTF-8`);
}
| 28 | + |
// Encodes a run of UTF-16 code units as a MessagePack string: the str header
// is written first, followed by the UTF-8 bytes.
//
// outputPtr:   u8*  - where the header and UTF-8 bytes are written
// inputPtr:    u16* - first code unit; each unit is read with loadUint16BE
// inputLength: number of u16 code units (not bytes)
//
// Returns the total number of bytes written, header included.
//
// A high surrogate followed by a low surrogate is combined into a single
// code point and emitted as 4 bytes. Any other surrogate code unit is emitted
// on its own as a 3-byte sequence.
// NOTE(review): nothing here checks the output capacity - presumably the
// caller sizes the buffer; confirm at the call site.
export function utf8EncodeUint16Array(outputPtr: usize, inputPtr: usize, inputLength: usize): usize {
  // The header needs the encoded byte length up front, so count first.
  const payloadLength = utf8CountUint16Array(inputPtr, inputLength);
  let dst = storeStringHeader(outputPtr, payloadLength);

  const unitSize = sizeof<u16>();
  const srcEnd = inputPtr + inputLength * unitSize;
  let src = inputPtr;

  while (src < srcEnd) {
    let codePoint: u32 = loadUint16BE(src);
    src += unitSize;

    // 1-byte
    if (codePoint < 0x80) {
      store<u8>(dst++, codePoint);
      continue;
    }

    // 2-bytes
    if (codePoint < 0x800) {
      store<u8>(dst++, ((codePoint >> 6) & 0x1f) | 0xc0);
      store<u8>(dst++, (codePoint & 0x3f) | 0x80);
      continue;
    }

    // handle surrogate pair: only consume the next unit when it really is a
    // low surrogate; otherwise the current unit is encoded by itself.
    const isHighSurrogate = codePoint >= 0xd800 && codePoint <= 0xdbff;
    if (isHighSurrogate && src < srcEnd) {
      const next: u32 = loadUint16BE(src);
      if ((next & 0xfc00) === 0xdc00) {
        src += unitSize;
        codePoint = ((codePoint & 0x3ff) << 10) + (next & 0x3ff) + 0x10000;
      }
    }

    if (codePoint < 0x10000) {
      // 3-byte: lead byte
      store<u8>(dst++, ((codePoint >> 12) & 0x0f) | 0xe0);
    } else {
      // 4-byte: lead byte plus the first continuation byte
      store<u8>(dst++, ((codePoint >> 18) & 0x07) | 0xf0);
      store<u8>(dst++, ((codePoint >> 12) & 0x3f) | 0x80);
    }

    // The last two continuation bytes are the same for 3- and 4-byte forms.
    store<u8>(dst++, ((codePoint >> 6) & 0x3f) | 0x80);
    store<u8>(dst++, (codePoint & 0x3f) | 0x80);
  }

  return dst - outputPtr;
}
0 commit comments