1
0
Fork 0
mirror of https://github.com/emojisum/emojisum.git synced 2024-12-02 11:55:42 +00:00
emojisum/emoji/map.go
Vincent Batts f0d758ab5f
emoji: adding a helper to parse a hex string into codepoint
Signed-off-by: Vincent Batts <vbatts@hashbangbash.com>
2018-10-22 15:19:50 +01:00

96 lines
2.5 KiB
Go

package emoji
import (
"encoding/hex"
"fmt"
"strconv"
"strings"
)
// Map returns the emoji words stored at position b of the package's emoji
// table. The table is indexed by a single byte, so positions run from 0 to 255.
//
// If the table holds fewer entries than b requires (for instance when it has
// not been populated), Map returns nil instead of panicking with an
// index-out-of-range error.
func Map(b byte) Words {
	if int(b) >= len(mapGen.EmojiWords) {
		return nil
	}
	return mapGen.EmojiWords[b]
}
// Version reports the version string of the emojisum document that this
// package is currently compiled against.
func Version() string {
	current := mapGen.Version
	return current
}
// mapGen is the package-level emoji table that Map and Version read from.
// NOTE(review): nothing in this file assigns it — presumably generated code
// elsewhere in the package populates it; confirm.
var mapGen VersionedMap
// VersionedMap is the structure used for the `emojimap.json` document.
type VersionedMap struct {
// Description maps to the "description" key of the document.
Description string `json:"description"`
// Version maps to the "version" key of the document; Version() returns it.
Version string `json:"version"`
// EmojiWords is an ordered list, referenced by a byte (each byte of a
// checksum digest): the byte value is the index into this slice.
EmojiWords []Words `json:"emojiwords"`
}
// Words is the set of alternative representations of a single emoji.
// Possible entries are the ":colon_notation:" name, a "U+26CF" style
// codepoint, or the unicode value itself.
type Words []string
// IsColonNotation reports whether word is in the ":colon_notation:" form of an
// emoji: a non-empty name wrapped in a leading and a trailing colon.
//
// A lone ":" and an empty "::" are rejected. A bare prefix/suffix test would
// accept ":" because the single colon satisfies both ends at once.
func IsColonNotation(word string) bool {
	return len(word) > 2 && strings.HasPrefix(word, ":") && strings.HasSuffix(word, ":")
}
// IsCodepoint reports whether word is written in the "U+1234" codepoint style
// of emoji. The "U+" marker is matched case-insensitively and only the start
// of the word is examined, so combinations of several codepoints (flags, for
// example) qualify as well.
func IsCodepoint(word string) bool {
	if strings.HasPrefix(word, "U+") {
		return true
	}
	return strings.HasPrefix(word, "u+")
}
// unicodeURL is the unicode.org chart page that lists every emoji.
var unicodeURL = `http://www.unicode.org/emoji/charts/full-emoji-list.html`

// UnicodeLinkURL returns a link into the unicode.org emoji list for word.
// When word is in codepoint notation the link carries a fragment built from
// the lower-cased hex values joined by "_" (for example "#1f1e6_1f1fa");
// for any other word the plain list URL is returned.
func UnicodeLinkURL(word string) string {
	if IsCodepoint(word) {
		// Drop the leading marker, then turn each remaining "u+" separator
		// into the "_" used by the chart's anchors.
		anchor := strings.TrimPrefix(strings.ToLower(word), "u+")
		anchor = strings.Replace(anchor, "u+", "_", -1)
		return fmt.Sprintf("%s#%s", unicodeURL, anchor)
	}
	return unicodeURL
}
// CodepointToUnicode converts a "U+26CF" style word into the UTF-8 string for
// the code point(s) it names (the equivalent of the `\U000026CF` escape).
// Several code points may be chained back to back, e.g. "U+1F1E6U+1F1FA", and
// the "U+" marker is matched case-insensitively.
//
// A word that is not in codepoint notation is returned unchanged. Conversion
// stops at the first chunk that is not plain hexadecimal (a sign prefix is not
// accepted) or that does not name a Unicode scalar value (above U+10FFFF or
// inside the surrogate range); whatever was decoded before that chunk is
// returned.
func CodepointToUnicode(word string) string {
	if !IsCodepoint(word) {
		return word
	}

	const (
		maxRune      = 0x10FFFF // highest valid Unicode code point
		surrogateMin = 0xD800   // first UTF-16 surrogate, not a scalar value
		surrogateMax = 0xDFFF   // last UTF-16 surrogate
	)

	var out strings.Builder
	chunks := strings.Split(strings.TrimPrefix(strings.ToUpper(word), "U+"), "U+")
	for _, chunk := range chunks {
		cp, err := strconv.ParseUint(chunk, 16, 32)
		if err != nil || cp > maxRune || (cp >= surrogateMin && cp <= surrogateMax) {
			// Emitting U+FFFD for a bogus value would hide the problem, so an
			// invalid code point ends the conversion just like a parse error.
			break
		}
		out.WriteRune(rune(cp))
	}
	return out.String()
}
// FromHexString decodes s, a hexadecimal string with two characters per byte,
// and returns the emoji for each decoded byte concatenated in order.
//
// Every byte is looked up with Map; the first word of that entry that is in
// codepoint notation ("U+....") is converted with CodepointToUnicode. A byte
// whose entry has no codepoint word contributes nothing to the result. An
// error is returned only when s is not valid hexadecimal, in which case the
// returned string is empty.
func FromHexString(s string) (string, error) {
	raw, err := hex.DecodeString(s)
	if err != nil {
		return "", err
	}

	var out strings.Builder
	for _, b := range raw {
		for _, word := range Map(b) {
			// Use the first codepoint-style word, then move on to the next byte.
			if IsCodepoint(word) {
				out.WriteString(CodepointToUnicode(word))
				break
			}
		}
	}
	return out.String(), nil
}