| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231 |
- function toString(number) {
- if (number < 255) {
- if (number > 32 && number < 127) {
- const char = String.fromCharCode(number);
- if (
- // 0-9
- number > 47 && number < 58 || // A-Z
- number > 64 && number < 91 || // _`a-z
- number > 94 && number < 123
- ) {
- return char;
- }
- return "\\" + char;
- }
- return "\\x" + (number < 16 ? "0" : "") + number.toString(16).toUpperCase();
- }
- return "\\u" + number.toString(16).toUpperCase();
- }
- function wrapRegexInGroup(regex) {
- return "(?:" + regex + ")";
- }
- function updateUTF16EmojiRegexItem(item) {
- const numbers = item.numbers;
- if (numbers.length === 1) {
- const num = numbers[0];
- return item.regex = toString(num);
- }
- numbers.sort((a, b) => a - b);
- const chars = [];
- let range = null;
- const addRange = () => {
- if (range) {
- const { start, last, numbers: numbers2 } = range;
- range = null;
- if (last > start + 1) {
- chars.push(toString(start) + "-" + toString(last));
- } else {
- for (let i = 0; i < numbers2.length; i++) {
- chars.push(toString(numbers2[i]));
- }
- }
- }
- };
- for (let i = 0; i < numbers.length; i++) {
- const num = numbers[i];
- if (range) {
- if (range.last === num) {
- continue;
- }
- if (range.last === num - 1) {
- range.numbers.push(num);
- range.last = num;
- continue;
- }
- }
- addRange();
- range = {
- start: num,
- last: num,
- numbers: [num]
- };
- }
- addRange();
- if (!chars.length) {
- throw new Error("Unexpected empty range");
- }
- return item.regex = "[" + chars.join("") + "]";
- }
- function createUTF16EmojiRegexItem(numbers) {
- const result = {
- type: "utf16",
- regex: "",
- numbers,
- length: 1,
- group: true
- };
- updateUTF16EmojiRegexItem(result);
- return result;
- }
- function updateSequenceEmojiRegexItem(item) {
- return item.regex = item.items.map((childItem) => {
- if (!childItem.group && childItem.type === "set") {
- return wrapRegexInGroup(childItem.regex);
- }
- return childItem.regex;
- }).join("");
- }
- function createSequenceEmojiRegexItem(sequence, numbers) {
- let items = [];
- sequence.forEach((item) => {
- if (item.type === "sequence") {
- items = items.concat(item.items);
- } else {
- items.push(item);
- }
- });
- if (!items.length) {
- throw new Error("Empty sequence");
- }
- const result = {
- type: "sequence",
- items,
- regex: "",
- length: items.reduce((length, item) => item.length + length, 0),
- group: false
- };
- if (sequence.length === 1) {
- const firstItem = sequence[0];
- result.group = firstItem.group;
- if (firstItem.type !== "optional") {
- const numbers2 = firstItem.numbers;
- if (numbers2) {
- result.numbers = numbers2;
- }
- }
- }
- if (numbers) {
- result.numbers = numbers;
- }
- updateSequenceEmojiRegexItem(result);
- return result;
- }
- function updateSetEmojiRegexItem(item) {
- if (item.sets.length === 1) {
- const firstItem = item.sets[0];
- item.group = firstItem.group;
- return item.regex = firstItem.regex;
- }
- item.group = false;
- return item.regex = item.sets.map((childItem) => childItem.regex).join("|");
- }
- function createSetEmojiRegexItem(set) {
- let sets = [];
- let numbers = [];
- set.forEach((item) => {
- if (item.type === "set") {
- sets = sets.concat(item.sets);
- } else {
- sets.push(item);
- }
- if (numbers) {
- if (item.type === "optional" || !item.numbers) {
- numbers = null;
- } else {
- numbers = [...numbers, ...item.numbers];
- }
- }
- });
- sets.sort((a, b) => {
- if (a.length === b.length) {
- return a.regex.localeCompare(b.regex);
- }
- return b.length - a.length;
- });
- const result = {
- type: "set",
- sets,
- regex: "",
- length: sets.reduce(
- (length, item) => length ? Math.min(length, item.length) : item.length,
- 0
- ),
- group: false
- };
- if (numbers) {
- result.numbers = numbers;
- }
- if (set.length === 1) {
- const firstItem = set[0];
- result.group = firstItem.group;
- }
- updateSetEmojiRegexItem(result);
- return result;
- }
- function updateOptionalEmojiRegexItem(item) {
- const childItem = item.item;
- const regex = (childItem.group ? childItem.regex : wrapRegexInGroup(childItem.regex)) + "?";
- return item.regex = regex;
- }
- function createOptionalEmojiRegexItem(item) {
- if (item.type === "optional") {
- return item;
- }
- const result = {
- type: "optional",
- item,
- regex: "",
- length: item.length,
- group: true
- };
- updateOptionalEmojiRegexItem(result);
- return result;
- }
- function cloneEmojiRegexItem(item, shallow = false) {
- const result = {
- ...item
- };
- if (result.type !== "optional" && result.numbers) {
- result.numbers = [...result.numbers];
- }
- switch (result.type) {
- case "utf16":
- break;
- case "sequence":
- if (shallow) {
- result.items = [...result.items];
- } else {
- result.items = result.items.map(
- (item2) => cloneEmojiRegexItem(item2, false)
- );
- }
- break;
- case "set":
- if (shallow) {
- result.sets = [...result.sets];
- } else {
- result.sets = result.sets.map(
- (item2) => cloneEmojiRegexItem(item2, false)
- );
- }
- break;
- case "optional":
- if (!shallow) {
- result.item = cloneEmojiRegexItem(result.item, false);
- }
- break;
- }
- return result;
- }
- export { cloneEmojiRegexItem, createOptionalEmojiRegexItem, createSequenceEmojiRegexItem, createSetEmojiRegexItem, createUTF16EmojiRegexItem, updateOptionalEmojiRegexItem, updateSequenceEmojiRegexItem, updateSetEmojiRegexItem, updateUTF16EmojiRegexItem, wrapRegexInGroup };
|