You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

generate-emoji.go 4.7KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223
  1. // Copyright 2020 The Gitea Authors. All rights reserved.
  2. // Copyright 2015 Kenneth Shaw
  3. // SPDX-License-Identifier: MIT
  4. //go:build ignore
  5. package main
  6. import (
  7. "flag"
  8. "fmt"
  9. "go/format"
  10. "io"
  11. "log"
  12. "net/http"
  13. "os"
  14. "regexp"
  15. "sort"
  16. "strconv"
  17. "strings"
  18. "unicode/utf8"
  19. "code.gitea.io/gitea/modules/json"
  20. )
  21. const (
  22. gemojiURL = "https://raw.githubusercontent.com/github/gemoji/master/db/emoji.json"
  23. maxUnicodeVersion = 15
  24. )
  25. var flagOut = flag.String("o", "modules/emoji/emoji_data.go", "out")
  26. // Gemoji is a set of emoji data.
  27. type Gemoji []Emoji
  28. // Emoji represents a single emoji and associated data.
  29. type Emoji struct {
  30. Emoji string `json:"emoji"`
  31. Description string `json:"description,omitempty"`
  32. Aliases []string `json:"aliases"`
  33. UnicodeVersion string `json:"unicode_version,omitempty"`
  34. SkinTones bool `json:"skin_tones,omitempty"`
  35. }
  36. // Don't include some fields in JSON
  37. func (e Emoji) MarshalJSON() ([]byte, error) {
  38. type emoji Emoji
  39. x := emoji(e)
  40. x.UnicodeVersion = ""
  41. x.Description = ""
  42. x.SkinTones = false
  43. return json.Marshal(x)
  44. }
  45. func main() {
  46. var err error
  47. flag.Parse()
  48. // generate data
  49. buf, err := generate()
  50. if err != nil {
  51. log.Fatalf("generate err: %v", err)
  52. }
  53. // write
  54. err = os.WriteFile(*flagOut, buf, 0o644)
  55. if err != nil {
  56. log.Fatalf("WriteFile err: %v", err)
  57. }
  58. }
  59. var replacer = strings.NewReplacer(
  60. "main.Gemoji", "Gemoji",
  61. "main.Emoji", "\n",
  62. "}}", "},\n}",
  63. ", Description:", ", ",
  64. ", Aliases:", ", ",
  65. ", UnicodeVersion:", ", ",
  66. ", SkinTones:", ", ",
  67. )
  68. var emojiRE = regexp.MustCompile(`\{Emoji:"([^"]*)"`)
  69. func generate() ([]byte, error) {
  70. var err error
  71. // load gemoji data
  72. res, err := http.Get(gemojiURL)
  73. if err != nil {
  74. return nil, err
  75. }
  76. defer res.Body.Close()
  77. // read all
  78. body, err := io.ReadAll(res.Body)
  79. if err != nil {
  80. return nil, err
  81. }
  82. // unmarshal
  83. var data Gemoji
  84. err = json.Unmarshal(body, &data)
  85. if err != nil {
  86. return nil, err
  87. }
  88. skinTones := make(map[string]string)
  89. skinTones["\U0001f3fb"] = "Light Skin Tone"
  90. skinTones["\U0001f3fc"] = "Medium-Light Skin Tone"
  91. skinTones["\U0001f3fd"] = "Medium Skin Tone"
  92. skinTones["\U0001f3fe"] = "Medium-Dark Skin Tone"
  93. skinTones["\U0001f3ff"] = "Dark Skin Tone"
  94. var tmp Gemoji
  95. // filter out emoji that require greater than max unicode version
  96. for i := range data {
  97. val, _ := strconv.ParseFloat(data[i].UnicodeVersion, 64)
  98. if int(val) <= maxUnicodeVersion {
  99. tmp = append(tmp, data[i])
  100. }
  101. }
  102. data = tmp
  103. sort.Slice(data, func(i, j int) bool {
  104. return data[i].Aliases[0] < data[j].Aliases[0]
  105. })
  106. aliasMap := make(map[string]int, len(data))
  107. for i, e := range data {
  108. if e.Emoji == "" || len(e.Aliases) == 0 {
  109. continue
  110. }
  111. for _, a := range e.Aliases {
  112. if a == "" {
  113. continue
  114. }
  115. aliasMap[a] = i
  116. }
  117. }
  118. // gitea customizations
  119. i, ok := aliasMap["tada"]
  120. if ok {
  121. data[i].Aliases = append(data[i].Aliases, "hooray")
  122. }
  123. i, ok = aliasMap["laughing"]
  124. if ok {
  125. data[i].Aliases = append(data[i].Aliases, "laugh")
  126. }
  127. // write a JSON file to use with tribute (write before adding skin tones since we can't support them there yet)
  128. file, _ := json.Marshal(data)
  129. _ = os.WriteFile("assets/emoji.json", file, 0o644)
  130. // Add skin tones to emoji that support it
  131. var (
  132. s []string
  133. newEmoji string
  134. newDescription string
  135. newData Emoji
  136. )
  137. for i := range data {
  138. if data[i].SkinTones {
  139. for k, v := range skinTones {
  140. s = strings.Split(data[i].Emoji, "")
  141. if utf8.RuneCountInString(data[i].Emoji) == 1 {
  142. s = append(s, k)
  143. } else {
  144. // insert into slice after first element because all emoji that support skin tones
  145. // have that modifier placed at this spot
  146. s = append(s, "")
  147. copy(s[2:], s[1:])
  148. s[1] = k
  149. }
  150. newEmoji = strings.Join(s, "")
  151. newDescription = data[i].Description + ": " + v
  152. newAlias := data[i].Aliases[0] + "_" + strings.ReplaceAll(v, " ", "_")
  153. newData = Emoji{newEmoji, newDescription, []string{newAlias}, "12.0", false}
  154. data = append(data, newData)
  155. }
  156. }
  157. }
  158. sort.Slice(data, func(i, j int) bool {
  159. return data[i].Aliases[0] < data[j].Aliases[0]
  160. })
  161. // add header
  162. str := replacer.Replace(fmt.Sprintf(hdr, gemojiURL, data))
  163. // change the format of the unicode string
  164. str = emojiRE.ReplaceAllStringFunc(str, func(s string) string {
  165. var err error
  166. s, err = strconv.Unquote(s[len("{Emoji:"):])
  167. if err != nil {
  168. panic(err)
  169. }
  170. return "{" + strconv.QuoteToASCII(s)
  171. })
  172. // format
  173. return format.Source([]byte(str))
  174. }
  175. const hdr = `
  176. // Copyright 2020 The Gitea Authors. All rights reserved.
  177. // SPDX-License-Identifier: MIT
  178. package emoji
  179. // Code generated by build/generate-emoji.go. DO NOT EDIT.
  180. // Sourced from %s
  181. var GemojiData = %#v
  182. `