2020-04-28 14:05:39 -04:00
// Copyright 2020 The Gitea Authors. All rights reserved.
// Copyright 2015 Kenneth Shaw
2022-11-27 13:20:29 -05:00
// SPDX-License-Identifier: MIT
2020-04-28 14:05:39 -04:00
2021-08-24 11:47:09 -05:00
//go:build ignore
2020-04-28 14:05:39 -04:00
package main
import (
"flag"
"fmt"
"go/format"
2021-09-22 13:38:34 +08:00
"io"
2020-04-28 14:05:39 -04:00
"log"
"net/http"
2021-09-22 13:38:34 +08:00
"os"
2020-04-28 14:05:39 -04:00
"regexp"
"sort"
"strconv"
"strings"
2020-06-02 02:22:40 -04:00
"unicode/utf8"
2021-03-01 21:08:10 +00:00
2021-07-25 00:03:58 +08:00
"code.gitea.io/gitea/modules/json"
2020-04-28 14:05:39 -04:00
)
const (
gemojiURL = "https://raw.githubusercontent.com/github/gemoji/master/db/emoji.json"
2023-01-04 12:52:48 -05:00
maxUnicodeVersion = 14
2020-04-28 14:05:39 -04:00
)
2022-01-20 18:46:10 +01:00
var flagOut = flag . String ( "o" , "modules/emoji/emoji_data.go" , "out" )
2020-04-28 14:05:39 -04:00
// Gemoji is a set of emoji data.
type Gemoji [ ] Emoji
// Emoji represents a single emoji and associated data.
type Emoji struct {
Emoji string ` json:"emoji" `
Description string ` json:"description,omitempty" `
Aliases [ ] string ` json:"aliases" `
UnicodeVersion string ` json:"unicode_version,omitempty" `
2020-06-02 02:22:40 -04:00
SkinTones bool ` json:"skin_tones,omitempty" `
2020-04-28 14:05:39 -04:00
}
// Don't include some fields in JSON
func ( e Emoji ) MarshalJSON ( ) ( [ ] byte , error ) {
type emoji Emoji
x := emoji ( e )
x . UnicodeVersion = ""
x . Description = ""
2020-06-02 02:22:40 -04:00
x . SkinTones = false
2020-04-28 14:05:39 -04:00
return json . Marshal ( x )
}
func main ( ) {
var err error
flag . Parse ( )
// generate data
buf , err := generate ( )
if err != nil {
log . Fatal ( err )
}
// write
2022-01-20 18:46:10 +01:00
err = os . WriteFile ( * flagOut , buf , 0 o644 )
2020-04-28 14:05:39 -04:00
if err != nil {
log . Fatal ( err )
}
}
var replacer = strings . NewReplacer (
"main.Gemoji" , "Gemoji" ,
"main.Emoji" , "\n" ,
"}}" , "},\n}" ,
", Description:" , ", " ,
", Aliases:" , ", " ,
", UnicodeVersion:" , ", " ,
2020-06-02 02:22:40 -04:00
", SkinTones:" , ", " ,
2020-04-28 14:05:39 -04:00
)
var emojiRE = regexp . MustCompile ( ` \ { Emoji:"([^"]*)" ` )
func generate ( ) ( [ ] byte , error ) {
var err error
// load gemoji data
res , err := http . Get ( gemojiURL )
if err != nil {
return nil , err
}
defer res . Body . Close ( )
// read all
2021-09-22 13:38:34 +08:00
body , err := io . ReadAll ( res . Body )
2020-04-28 14:05:39 -04:00
if err != nil {
return nil , err
}
// unmarshal
var data Gemoji
err = json . Unmarshal ( body , & data )
if err != nil {
return nil , err
}
2022-01-20 18:46:10 +01:00
skinTones := make ( map [ string ] string )
2020-04-28 14:05:39 -04:00
2020-06-02 02:22:40 -04:00
skinTones [ "\U0001f3fb" ] = "Light Skin Tone"
skinTones [ "\U0001f3fc" ] = "Medium-Light Skin Tone"
skinTones [ "\U0001f3fd" ] = "Medium Skin Tone"
skinTones [ "\U0001f3fe" ] = "Medium-Dark Skin Tone"
skinTones [ "\U0001f3ff" ] = "Dark Skin Tone"
var tmp Gemoji
2022-01-20 18:46:10 +01:00
// filter out emoji that require greater than max unicode version
2020-04-28 14:05:39 -04:00
for i := range data {
val , _ := strconv . ParseFloat ( data [ i ] . UnicodeVersion , 64 )
if int ( val ) <= maxUnicodeVersion {
tmp = append ( tmp , data [ i ] )
}
}
data = tmp
sort . Slice ( data , func ( i , j int ) bool {
return data [ i ] . Aliases [ 0 ] < data [ j ] . Aliases [ 0 ]
} )
aliasMap := make ( map [ string ] int , len ( data ) )
for i , e := range data {
if e . Emoji == "" || len ( e . Aliases ) == 0 {
continue
}
for _ , a := range e . Aliases {
if a == "" {
continue
}
aliasMap [ a ] = i
}
}
// gitea customizations
i , ok := aliasMap [ "tada" ]
if ok {
data [ i ] . Aliases = append ( data [ i ] . Aliases , "hooray" )
}
i , ok = aliasMap [ "laughing" ]
if ok {
data [ i ] . Aliases = append ( data [ i ] . Aliases , "laugh" )
}
2020-06-02 02:22:40 -04:00
// write a JSON file to use with tribute (write before adding skin tones since we can't support them there yet)
file , _ := json . Marshal ( data )
2022-01-20 18:46:10 +01:00
_ = os . WriteFile ( "assets/emoji.json" , file , 0 o644 )
2020-06-02 02:22:40 -04:00
// Add skin tones to emoji that support it
var (
s [ ] string
newEmoji string
newDescription string
newData Emoji
)
for i := range data {
if data [ i ] . SkinTones {
for k , v := range skinTones {
s = strings . Split ( data [ i ] . Emoji , "" )
if utf8 . RuneCountInString ( data [ i ] . Emoji ) == 1 {
s = append ( s , k )
} else {
// insert into slice after first element because all emoji that support skin tones
2021-02-05 02:57:42 +09:00
// have that modifier placed at this spot
2020-06-02 02:22:40 -04:00
s = append ( s , "" )
copy ( s [ 2 : ] , s [ 1 : ] )
s [ 1 ] = k
}
newEmoji = strings . Join ( s , "" )
newDescription = data [ i ] . Description + ": " + v
newAlias := data [ i ] . Aliases [ 0 ] + "_" + strings . ReplaceAll ( v , " " , "_" )
newData = Emoji { newEmoji , newDescription , [ ] string { newAlias } , "12.0" , false }
data = append ( data , newData )
}
}
}
2023-01-05 12:58:51 +01:00
sort . Slice ( data , func ( i , j int ) bool {
return data [ i ] . Aliases [ 0 ] < data [ j ] . Aliases [ 0 ]
} )
2020-04-28 14:05:39 -04:00
// add header
str := replacer . Replace ( fmt . Sprintf ( hdr , gemojiURL , data ) )
// change the format of the unicode string
str = emojiRE . ReplaceAllStringFunc ( str , func ( s string ) string {
var err error
s , err = strconv . Unquote ( s [ len ( "{Emoji:" ) : ] )
if err != nil {
panic ( err )
}
return "{" + strconv . QuoteToASCII ( s )
} )
// format
return format . Source ( [ ] byte ( str ) )
}
const hdr = `
// Copyright 2020 The Gitea Authors. All rights reserved.
2022-11-27 13:20:29 -05:00
// SPDX-License-Identifier: MIT
2020-04-28 14:05:39 -04:00
package emoji
2022-08-30 21:15:45 -05:00
// Code generated by build/generate-emoji.go. DO NOT EDIT.
2020-04-28 14:05:39 -04:00
// Sourced from %s
var GemojiData = % # v
`