require_relative "../lib/unicode/emoji" require "minitest/autorun" describe Unicode::Emoji do describe ".properties" do it "returns an Array for Emoji properties if has codepoints" do assert_equal ["Emoji", "Emoji_Presentation", "Extended_Pictographic"], Unicode::Emoji.properties("😴") assert_equal ["Emoji", "Extended_Pictographic"], Unicode::Emoji.properties("β™ ") end it "returns nil for Emoji properties if has no codepoints" do assert_nil Unicode::Emoji.properties("A") end end describe "REGEX" do it "matches most singleton emoji codepoints" do "😴 sleeping face" =~ Unicode::Emoji::REGEX assert_equal "😴", $& end it "matches singleton emoji in combination with emoji variation selector" do "😴\u{FE0F} sleeping face" =~ Unicode::Emoji::REGEX assert_equal "😴\u{FE0F}", $& end it "does not match singleton emoji in combination with text variation selector" do "😴\u{FE0E} sleeping face" =~ Unicode::Emoji::REGEX assert_nil $& end it "does not match textual singleton emoji" do "β–Ά play button" =~ Unicode::Emoji::REGEX assert_nil $& end it "matches textual singleton emoji in combination with emoji variation selector" do "β–Ά\u{FE0F} play button" =~ Unicode::Emoji::REGEX assert_equal "β–Ά\u{FE0F}", $& end it "does not match singleton 'component' emoji codepoints" do "🏻 light skin tone" =~ Unicode::Emoji::REGEX assert_nil $& end it "matches modified emoji if modifier base emoji is used" do "πŸ›ŒπŸ½ person in bed: medium skin tone" =~ Unicode::Emoji::REGEX assert_equal "πŸ›ŒπŸ½", $& end it "does not match modified emoji if no modifier base emoji is used" do "🌡🏽 cactus" =~ Unicode::Emoji::REGEX assert_equal "🌡", $& end it "matches valid region flags" do "πŸ‡΅πŸ‡Ή Portugal" =~ Unicode::Emoji::REGEX assert_equal "πŸ‡΅πŸ‡Ή", $& end it "does not match invalid region flags" do "πŸ‡΅πŸ‡΅ PP Land" =~ Unicode::Emoji::REGEX assert_nil $& end it "matches emoji keycap sequences" do "2️⃣ keycap: 2" =~ Unicode::Emoji::REGEX assert_equal "2️⃣", $& end it "matches recommended tag sequences" do "🏴󠁧󠁒󠁳󠁣󠁴󠁿 Scotland" =~ Unicode::Emoji::REGEX assert_equal "🏴󠁧󠁒󠁳󠁣󠁴󠁿", $& end it "does not match valid tag sequences that are not recommended" do "🏴󠁧󠁒󠁑󠁧󠁒󠁿 GB AGB" =~ Unicode::Emoji::REGEX assert_equal "🏴", $& # only base flag is matched end it "matches recommended zwj sequences" do "πŸ€ΎπŸ½β€β™€οΈ woman playing handball: medium skin tone" =~ Unicode::Emoji::REGEX assert_equal "πŸ€ΎπŸ½β€β™€οΈ", $& end it "does not match valid zwj sequences that are not recommended" do "πŸ€ β€πŸ€’ vomiting cowboy" =~ Unicode::Emoji::REGEX assert_equal "🀠", $& end it "matches 12.1 emoji" do "πŸ§‘β€πŸ¦± person: curly hair" =~ Unicode::Emoji::REGEX assert_equal "πŸ§‘β€πŸ¦±", $& end it "matches 13.0 emoji" do "πŸ‘¨β€πŸΌ man feeding baby" =~ Unicode::Emoji::REGEX assert_equal "πŸ‘¨β€πŸΌ", $& end it "matches 13.1 emoji" do "❀️‍πŸ”₯ heart on fire" =~ Unicode::Emoji::REGEX assert_equal "❀️‍πŸ”₯", $& end end describe "REGEX_VALID" do it "matches most singleton emoji codepoints" do "😴 sleeping face" =~ Unicode::Emoji::REGEX_VALID assert_equal "😴", $& end it "matches singleton emoji in combination with emoji variation selector" do "😴\u{FE0F} sleeping face" =~ Unicode::Emoji::REGEX_VALID assert_equal "😴\u{FE0F}", $& end it "does not match singleton emoji when in combination with text variation selector" do "😴\u{FE0E} sleeping face" =~ Unicode::Emoji::REGEX_VALID assert_nil $& end it "does not match textual singleton emoji" do "β–Ά play button" =~ Unicode::Emoji::REGEX_VALID assert_nil $& end it "matches textual singleton emoji in combination with emoji variation selector" do "β–Ά\u{FE0F} play button" =~ Unicode::Emoji::REGEX_VALID assert_equal "β–Ά\u{FE0F}", $& end it "does not match singleton 'component' emoji codepoints" do "🏻 light skin tone" =~ Unicode::Emoji::REGEX_VALID assert_nil $& end it "matches modified emoji if modifier base emoji is used" do "πŸ›ŒπŸ½ person in bed: medium skin tone" =~ Unicode::Emoji::REGEX_VALID assert_equal "πŸ›ŒπŸ½", $& end it "does not match modified emoji if no modifier base emoji is used" do "🌡🏽 cactus" =~ Unicode::Emoji::REGEX_VALID assert_equal "🌡", $& end it "matches valid region flags" do "πŸ‡΅πŸ‡Ή Portugal" =~ Unicode::Emoji::REGEX_VALID assert_equal "πŸ‡΅πŸ‡Ή", $& end it "does not match invalid region flags" do "πŸ‡΅πŸ‡΅ PP Land" =~ Unicode::Emoji::REGEX_VALID assert_nil $& end it "matches emoji keycap sequences" do "2️⃣ keycap: 2" =~ Unicode::Emoji::REGEX_VALID assert_equal "2️⃣", $& end it "matches recommended tag sequences" do "🏴󠁧󠁒󠁳󠁣󠁴󠁿 Scotland" =~ Unicode::Emoji::REGEX_VALID assert_equal "🏴󠁧󠁒󠁳󠁣󠁴󠁿", $& end it "matches valid tag sequences, even though they are not recommended" do "🏴󠁧󠁒󠁑󠁧󠁒󠁿 GB AGB" =~ Unicode::Emoji::REGEX_VALID assert_equal "🏴󠁧󠁒󠁑󠁧󠁒󠁿", $& end it "does not match invalid tag sequences" do "🏴󠁧󠁒󠁑󠁑󠁑󠁿 GB AAA" =~ Unicode::Emoji::REGEX_VALID assert_equal "🏴", $& # only base flag is matched end it "matches recommended zwj sequences" do "πŸ€ΎπŸ½β€β™€οΈ woman playing handball: medium skin tone" =~ Unicode::Emoji::REGEX_VALID assert_equal "πŸ€ΎπŸ½β€β™€οΈ", $& end it "matches valid zwj sequences, even though they are not recommended" do "πŸ€ β€πŸ€’ vomiting cowboy" =~ Unicode::Emoji::REGEX_VALID assert_equal "πŸ€ β€πŸ€’", $& end end describe "REGEX_WELL_FORMED" do it "matches most singleton emoji codepoints" do "😴 sleeping face" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "😴", $& end it "matches singleton emoji in combination with emoji variation selector" do "😴\u{FE0F} sleeping face" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "😴\u{FE0F}", $& end it "does not match singleton emoji when in combination with text variation selector" do "😴\u{FE0E} sleeping face" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_nil $& end it "does not match textual singleton emoji" do "β–Ά play button" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_nil $& end it "matches textual singleton emoji in combination with emoji variation selector" do "β–Ά\u{FE0F} play button" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "β–Ά\u{FE0F}", $& end it "does not match singleton 'component' emoji codepoints" do "🏻 light skin tone" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_nil $& end it "matches modified emoji if modifier base emoji is used" do "πŸ›ŒπŸ½ person in bed: medium skin tone" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "πŸ›ŒπŸ½", $& end it "does not match modified emoji if no modifier base emoji is used" do "🌡🏽 cactus" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "🌡", $& end it "matches valid region flags" do "πŸ‡΅πŸ‡Ή Portugal" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "πŸ‡΅πŸ‡Ή", $& end it "does match invalid region flags" do "πŸ‡΅πŸ‡΅ PP Land" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "πŸ‡΅πŸ‡΅", $& end it "matches emoji keycap sequences" do "2️⃣ keycap: 2" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "2️⃣", $& end it "matches recommended tag sequences" do "🏴󠁧󠁒󠁳󠁣󠁴󠁿 Scotland" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "🏴󠁧󠁒󠁳󠁣󠁴󠁿", $& end it "matches valid tag sequences, even though they are not recommended" do "🏴󠁧󠁒󠁑󠁧󠁒󠁿 GB AGB" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "🏴󠁧󠁒󠁑󠁧󠁒󠁿", $& end it "does match invalid tag sequences" do "😴󠁧󠁒󠁑󠁑󠁑󠁿 GB AAA" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "😴󠁧󠁒󠁑󠁑󠁑󠁿", $& end it "matches recommended zwj sequences" do "πŸ€ΎπŸ½β€β™€οΈ woman playing handball: medium skin tone" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "πŸ€ΎπŸ½β€β™€οΈ", $& end it "matches valid zwj sequences, even though they are not recommended" do "πŸ€ β€πŸ€’ vomiting cowboy" =~ Unicode::Emoji::REGEX_WELL_FORMED assert_equal "πŸ€ β€πŸ€’", $& end end describe "REGEX_BASIC" do it "matches most singleton emoji codepoints" do "😴 sleeping face" =~ Unicode::Emoji::REGEX_BASIC assert_equal "😴", $& end it "matches singleton emoji in combination with emoji variation selector" do "😴\u{FE0F} sleeping face" =~ Unicode::Emoji::REGEX_BASIC assert_equal "😴\u{FE0F}", $& end it "does not match singleton emoji when in combination with text variation selector" do "😴\u{FE0E} sleeping face" =~ Unicode::Emoji::REGEX_BASIC assert_nil $& end it "does not match textual singleton emoji" do "β–Ά play button" =~ Unicode::Emoji::REGEX assert_nil $& end it "matches textual singleton emoji in combination with emoji variation selector" do "β–Ά\u{FE0F} play button" =~ Unicode::Emoji::REGEX assert_equal "β–Ά\u{FE0F}", $& end it "does not match singleton 'component' emoji codepoints" do "🏻 light skin tone" =~ Unicode::Emoji::REGEX_BASIC assert_nil $& end it "does not match modified emoji" do "πŸ›ŒπŸ½ person in bed: medium skin tone" =~ Unicode::Emoji::REGEX_BASIC assert_equal "πŸ›Œ", $& end it "does not match region flags" do "πŸ‡΅πŸ‡Ή Portugal" =~ Unicode::Emoji::REGEX_BASIC assert_nil $& end it "does not match emoji keycap sequences" do "2️⃣ keycap: 2" =~ Unicode::Emoji::REGEX_BASIC assert_nil $& end it "does not match tag sequences" do "🏴󠁧󠁒󠁳󠁣󠁴󠁿 Scotland" =~ Unicode::Emoji::REGEX_BASIC assert_equal "🏴", $& # only base flag is matched end it "does not match zwj sequences" do "πŸ€ΎπŸ½β€β™€οΈ woman playing handball: medium skin tone" =~ Unicode::Emoji::REGEX_BASIC assert_equal "🀾", $& end end describe "REGEX_TEXT" do it "deos not match singleton emoji codepoints with emoji presentation and no variation selector" do "😴 sleeping face" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "does not match singleton emoji in combination with emoji variation selector" do "😴\u{FE0F} sleeping face" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "matches singleton emoji in combination with text variation selector" do "😴\u{FE0E} sleeping face" =~ Unicode::Emoji::REGEX_TEXT assert_equal "😴\u{FE0E}", $& end it "matches textual singleton emoji" do "β–Ά play button" =~ Unicode::Emoji::REGEX_TEXT assert_equal "β–Ά", $& end it "does not match textual singleton emoji in combination with emoji variation selector" do "β–Ά\u{FE0F} play button" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "does not match textual singleton emoji in combination with emoji modifiers" do "✌🏻 victory hand" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "does not match singleton 'component' emoji codepoints" do "🏻 light skin tone" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "does not match modified emoji" do "πŸ›ŒπŸ½ person in bed: medium skin tone" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "does not match region flags" do "πŸ‡΅πŸ‡Ή Portugal" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "does not match emoji keycap sequences" do "2️⃣ keycap: 2" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "does not match tag sequences" do "🏴󠁧󠁒󠁳󠁣󠁴󠁿 Scotland" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end it "does not match zwj sequences" do "πŸ€ΎπŸ½β€β™€οΈ woman playing handball: medium skin tone" =~ Unicode::Emoji::REGEX_TEXT assert_nil $& end end describe "REGEX_ANY" do it "returns any emoji-related codepoint (but no variation selectors or tags)" do matches = "1 string 😴\u{FE0F} sleeping face with πŸ‡΅ and modifier 🏾, also 🏴󠁧󠁒󠁳󠁣󠁴󠁿 Scotland".scan(Unicode::Emoji::REGEX_ANY) assert_equal ["1", "😴", "πŸ‡΅", "🏾", "🏴"], matches end end describe "REGEX_PICTO" do it "matches codepoints with Extended_Pictograph property (almost all emoji are, but also others)" do matches = "U+1F32D 🌭 HOT DOG, U+203C β€Ό DOUBLE EXCLAMATION MARK, U+26E8 ⛨ BLACK CROSS ON SHIELD".scan(Unicode::Emoji::REGEX_PICTO) assert_equal ["🌭", "β€Ό", "⛨"], matches end end describe "REGEX_PICTO" do it "matches codepoints with Extended_Pictograph property, but no Emoji property" do matches = "U+1F32D 🌭 HOT DOG, U+203C β€Ό DOUBLE EXCLAMATION MARK, U+26E8 ⛨ BLACK CROSS ON SHIELD".scan(Unicode::Emoji::REGEX_PICTO_NO_EMOJI) assert_equal ["⛨"], matches end end describe ".list" do it "returns a grouped list of emoji" do assert_includes Unicode::Emoji.list.keys, "Smileys & Emotion" end it "sub-groups the list of emoji" do assert_includes Unicode::Emoji.list("Smileys & Emotion").keys, "face-glasses" end it "has emoji in sub-groups" do assert_includes Unicode::Emoji.list("Smileys & Emotion", "face-glasses"), "😎" end it "issues a warning if attempting to retrieve old category" do assert_output nil, "Warning(unicode-emoji): The category of Smileys & People does not exist anymore\n" do assert_nil Unicode::Emoji.list("Smileys & People", "face-positive") end end end end