2022-03-18 22:50:24 +01:00
|
|
|
import * as plugins from './smartstring.plugins.js';
|
|
|
|
import * as base64 from './smartstring.base64.js';
|
2019-10-10 17:28:23 +02:00
|
|
|
|
2024-03-01 23:34:43 +01:00
|
|
|
export const isUtf8 = (stringArg: string): boolean => {
|
|
|
|
// Convert string to a Uint8Array. In browsers, this will be a bit more complex
|
|
|
|
// because we need to convert the string to a binary representation first.
|
|
|
|
const encoder = new TextEncoder();
|
|
|
|
const bytes = encoder.encode(stringArg);
|
|
|
|
|
2019-10-10 17:28:23 +02:00
|
|
|
let i = 0;
|
2019-10-10 18:14:07 +02:00
|
|
|
while (i < bytes.length) {
|
|
|
|
if (
|
|
|
|
// ASCII
|
|
|
|
bytes[i] === 0x09 ||
|
|
|
|
bytes[i] === 0x0a ||
|
|
|
|
bytes[i] === 0x0d ||
|
|
|
|
(0x20 <= bytes[i] && bytes[i] <= 0x7e)
|
|
|
|
) {
|
|
|
|
i += 1;
|
|
|
|
continue;
|
|
|
|
}
|
2019-10-10 17:28:23 +02:00
|
|
|
|
2019-10-10 18:14:07 +02:00
|
|
|
if (
|
|
|
|
// non-overlong 2-byte
|
|
|
|
0xc2 <= bytes[i] &&
|
|
|
|
bytes[i] <= 0xdf &&
|
2019-11-24 11:44:21 +00:00
|
|
|
0x80 <= bytes[i + 1] &&
|
|
|
|
bytes[i + 1] <= 0xbf
|
2019-10-10 18:14:07 +02:00
|
|
|
) {
|
|
|
|
i += 2;
|
|
|
|
continue;
|
|
|
|
}
|
2019-10-10 17:28:23 +02:00
|
|
|
|
2019-10-10 18:14:07 +02:00
|
|
|
if (
|
|
|
|
// excluding overlongs
|
|
|
|
(bytes[i] === 0xe0 &&
|
2019-11-24 11:44:21 +00:00
|
|
|
0xa0 <= bytes[i + 1] &&
|
|
|
|
bytes[i + 1] <= 0xbf &&
|
|
|
|
0x80 <= bytes[i + 2] &&
|
2024-03-01 23:34:43 +01:00
|
|
|
bytes[i + 2] <= 0xbf) ||
|
|
|
|
// straight 3-byte
|
2019-10-10 18:14:07 +02:00
|
|
|
(((0xe1 <= bytes[i] && bytes[i] <= 0xec) || bytes[i] === 0xee || bytes[i] === 0xef) &&
|
2019-11-24 11:44:21 +00:00
|
|
|
0x80 <= bytes[i + 1] &&
|
|
|
|
bytes[i + 1] <= 0xbf &&
|
|
|
|
0x80 <= bytes[i + 2] &&
|
2024-03-01 23:34:43 +01:00
|
|
|
bytes[i + 2] <= 0xbf) ||
|
|
|
|
// excluding surrogates
|
2019-10-10 18:14:07 +02:00
|
|
|
(bytes[i] === 0xed &&
|
2019-11-24 11:44:21 +00:00
|
|
|
0x80 <= bytes[i + 1] &&
|
|
|
|
bytes[i + 1] <= 0x9f &&
|
|
|
|
0x80 <= bytes[i + 2] &&
|
|
|
|
bytes[i + 2] <= 0xbf)
|
2019-10-10 18:14:07 +02:00
|
|
|
) {
|
|
|
|
i += 3;
|
|
|
|
continue;
|
|
|
|
}
|
2019-10-10 17:28:23 +02:00
|
|
|
|
2019-10-10 18:14:07 +02:00
|
|
|
if (
|
|
|
|
// planes 1-3
|
|
|
|
(bytes[i] === 0xf0 &&
|
2019-11-24 11:44:21 +00:00
|
|
|
0x90 <= bytes[i + 1] &&
|
|
|
|
bytes[i + 1] <= 0xbf &&
|
|
|
|
0x80 <= bytes[i + 2] &&
|
|
|
|
bytes[i + 2] <= 0xbf &&
|
|
|
|
0x80 <= bytes[i + 3] &&
|
2024-03-01 23:34:43 +01:00
|
|
|
bytes[i + 3] <= 0xbf) ||
|
|
|
|
// planes 4-15
|
2019-10-10 18:14:07 +02:00
|
|
|
(0xf1 <= bytes[i] &&
|
|
|
|
bytes[i] <= 0xf3 &&
|
2019-11-24 11:44:21 +00:00
|
|
|
0x80 <= bytes[i + 1] &&
|
|
|
|
bytes[i + 1] <= 0xbf &&
|
|
|
|
0x80 <= bytes[i + 2] &&
|
|
|
|
bytes[i + 2] <= 0xbf &&
|
|
|
|
0x80 <= bytes[i + 3] &&
|
2024-03-01 23:34:43 +01:00
|
|
|
bytes[i + 3] <= 0xbf) ||
|
|
|
|
// plane 16
|
2019-10-10 18:14:07 +02:00
|
|
|
(bytes[i] === 0xf4 &&
|
2019-11-24 11:44:21 +00:00
|
|
|
0x80 <= bytes[i + 1] &&
|
|
|
|
bytes[i + 1] <= 0x8f &&
|
|
|
|
0x80 <= bytes[i + 2] &&
|
|
|
|
bytes[i + 2] <= 0xbf &&
|
|
|
|
0x80 <= bytes[i + 3] &&
|
|
|
|
bytes[i + 3] <= 0xbf)
|
2019-10-10 18:14:07 +02:00
|
|
|
) {
|
|
|
|
i += 4;
|
|
|
|
continue;
|
2019-10-10 17:28:23 +02:00
|
|
|
}
|
|
|
|
|
2019-10-10 18:14:07 +02:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
2019-10-10 18:03:04 +02:00
|
|
|
};
|
|
|
|
|
2024-03-01 23:34:43 +01:00
|
|
|
|
2019-10-10 18:03:04 +02:00
|
|
|
export const isBase64 = (stringArg: string) => {
|
2019-10-10 18:24:03 +02:00
|
|
|
const notBase64 = /[^A-Z0-9+\/=]/i;
|
|
|
|
const len = stringArg.length;
|
|
|
|
if (!len || len % 4 !== 0 || notBase64.test(stringArg)) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
const firstPaddingChar = stringArg.indexOf('=');
|
2019-11-24 11:44:21 +00:00
|
|
|
return (
|
|
|
|
firstPaddingChar === -1 ||
|
2019-10-10 18:24:03 +02:00
|
|
|
firstPaddingChar === len - 1 ||
|
2019-11-24 11:44:21 +00:00
|
|
|
(firstPaddingChar === len - 2 && stringArg[len - 1] === '=')
|
|
|
|
);
|
2019-10-10 18:03:04 +02:00
|
|
|
};
|