2019-12-18 15:40:19 +00:00
|
|
|
/*
|
|
|
|
Copyright 2019 The Matrix.org Foundation C.I.C.
|
|
|
|
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
you may not use this file except in compliance with the License.
|
|
|
|
You may obtain a copy of the License at
|
|
|
|
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
See the License for the specific language governing permissions and
|
|
|
|
limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
import EMOJIBASE from "emojibase-data/en/compact.json";
|
2021-07-11 02:40:30 +00:00
|
|
|
import SHORTCODES from "emojibase-data/en/shortcodes/iamcal.json";
|
2023-06-29 11:17:05 +00:00
|
|
|
import { CompactEmoji } from "emojibase";
|
2019-12-18 15:40:19 +00:00
|
|
|
|
2023-06-29 11:17:05 +00:00
|
|
|
/**
 * An emoji record as used by this module: the emojibase compact record with
 * its `shortcodes` field replaced by one that is always an array of strings.
 */
export interface IEmoji extends Omit<CompactEmoji, "shortcodes"> {
    /**
     * Shortcodes for the emoji. When the shortcode dataset has no entry for
     * an emoji, one is generated from the emoji's label instead.
     */
    shortcodes: string[];
}
|
|
|
|
|
2019-12-18 15:40:19 +00:00
|
|
|
// Lookup from an emoji's unicode string to its record. Keys are stored with
// the variation selector stripped. Kept module-private: reads go through
// getEmojiFromUnicode, which applies the same stripping to the lookup key.
const UNICODE_TO_EMOJI: Map<string, IEmoji> = new Map();

// Lookup from a text emoticon to the emoji record that declares it.
export const EMOTICON_TO_EMOJI: Map<string, IEmoji> = new Map();
|
2019-12-18 15:40:19 +00:00
|
|
|
|
2023-02-13 17:01:43 +00:00
|
|
|
/**
 * Looks up the emoji record for a unicode emoji string.
 *
 * The input is normalised with stripVariation before the lookup, matching how
 * keys are stored in UNICODE_TO_EMOJI.
 *
 * @param unicode - the emoji string to look up
 * @returns the matching emoji record, or undefined when there is none
 */
export const getEmojiFromUnicode = (unicode: string): IEmoji | undefined => {
    const lookupKey = stripVariation(unicode);
    return UNICODE_TO_EMOJI.get(lookupKey);
};
|
2019-12-18 15:40:19 +00:00
|
|
|
|
2021-08-05 21:56:16 +00:00
|
|
|
/**
 * Tells whether the given string is exactly one regional indicator symbol.
 *
 * @param x - the string to test
 * @returns true only for a single character in the range U+1F1E6..U+1F1FF
 */
const isRegionalIndicator = (x: string): boolean => {
    // Array.from walks the string by code point, so a surrogate pair counts
    // as one character rather than as two UTF-16 code units.
    if (Array.from(x).length !== 1) {
        return false;
    }

    // Code point range for regional indicators, see
    // http://unicode.org/charts/PDF/Unicode-6.0/U60-1F100.pdf
    const codePoint = x.codePointAt(0);
    return codePoint !== undefined && codePoint >= 0x1f1e6 && codePoint <= 0x1f1ff;
};
|
2021-07-27 21:22:49 +00:00
|
|
|
|
2019-12-18 15:40:19 +00:00
|
|
|
// Category name for each emojibase group id; the array index is the group id.
const EMOJIBASE_GROUP_ID_TO_CATEGORY: string[] = [
    /* 0 */ "people", // smileys
    /* 1 */ "people", // actually people
    /* 2 */ "control", // modifiers and such, not displayed in picker
    /* 3 */ "nature",
    /* 4 */ "foods",
    /* 5 */ "places",
    /* 6 */ "activity",
    /* 7 */ "objects",
    /* 8 */ "symbols",
    /* 9 */ "flags",
];
|
|
|
|
|
2023-02-13 11:39:16 +00:00
|
|
|
/**
 * Emoji grouped by category name. Every list starts out empty; only the
 * categories declared here receive entries, so a category name without a key
 * in this object (such as "control") is never collected.
 */
export const DATA_BY_CATEGORY: Record<string, IEmoji[]> = {
    "people": [],
    "nature": [],
    "foods": [],
    "places": [],
    "activity": [],
    "objects": [],
    "symbols": [],
    "flags": [],
};
|
|
|
|
|
|
|
|
// Build the exported emoji list and, in the same pass, fill the lookup tables:
// the unicode -> emoji map, the emoticon -> emoji map and the per-category lists.
export const EMOJI: IEmoji[] = EMOJIBASE.map((emojiData) => {
    // If there's ever a gap in shortcode coverage, we fudge it by
    // filling it in with the emoji's CLDR annotation
    const shortcodeData = SHORTCODES[emojiData.hexcode] ?? [emojiData.label.toLowerCase().replace(/\W+/g, "_")];

    const emoji: IEmoji = {
        ...emojiData,
        // Homogenize shortcodes by ensuring that everything is an array
        shortcodes: typeof shortcodeData === "string" ? [shortcodeData] : shortcodeData,
    };

    // An emoji may have no group at all; check for that explicitly instead of
    // asserting it away and indexing the table with undefined.
    const groupCategory = emoji.group == null ? undefined : EMOJIBASE_GROUP_ID_TO_CATEGORY[emoji.group];

    // We manually include regional indicators in the symbols group, since
    // Emojibase intentionally leaves them uncategorized
    const categoryId = groupCategory ?? (isRegionalIndicator(emoji.unicode) ? "symbols" : null);

    // Only categories declared in DATA_BY_CATEGORY are collected. Emoji with
    // no category, or with one that has no list there, are left out of the
    // per-category lists but still returned and indexed below.
    if (categoryId !== null && Object.prototype.hasOwnProperty.call(DATA_BY_CATEGORY, categoryId)) {
        DATA_BY_CATEGORY[categoryId].push(emoji);
    }

    // Add mapping from unicode to Emoji object
    // The 'unicode' field that we use in emojibase has either
    // VS15 or VS16 appended to any characters that can take
    // variation selectors. Which one it appends depends
    // on whether emojibase considers their type to be 'text' or
    // 'emoji'. We therefore strip any variation chars from strings
    // both when building the map and when looking up.
    UNICODE_TO_EMOJI.set(stripVariation(emoji.unicode), emoji);

    if (emoji.emoticon) {
        // Add mapping from emoticon to Emoji object. The field holds either a
        // single emoticon or an array of them, so normalise to an array first.
        const emoticons = Array.isArray(emoji.emoticon) ? emoji.emoticon : [emoji.emoticon];
        for (const emoticon of emoticons) {
            EMOTICON_TO_EMOJI.set(emoticon, emoji);
        }
    }

    return emoji;
});
|
2020-01-07 18:48:55 +00:00
|
|
|
|
|
|
|
/**
 * Removes a variation selector (U+FE00..U+FE0F) from the end of a string.
 * At most one trailing selector is removed, and selectors elsewhere in the
 * string are left alone.
 *
 * NB. Skin tone modifiers are not variation selectors:
 * this function does not touch them. (Should it?)
 *
 * @param str - string to strip
 * @returns the string without its trailing variation selector, if it had one
 */
function stripVariation(str: string): string {
    // charCodeAt yields NaN for the empty string, which fails both comparisons.
    const lastUnit = str.charCodeAt(str.length - 1);
    const endsWithSelector = lastUnit >= 0xfe00 && lastUnit <= 0xfe0f;
    return endsWithSelector ? str.slice(0, -1) : str;
}
|