mirror of
https://github.com/crazy-max/diun.git
synced 2025-01-12 11:38:11 +00:00
64f77319b2
Bumps [github.com/PaulSonOfLars/gotgbot/v2](https://github.com/PaulSonOfLars/gotgbot) from 2.0.0-rc.27 to 2.0.0-rc.30. - [Release notes](https://github.com/PaulSonOfLars/gotgbot/releases) - [Commits](https://github.com/PaulSonOfLars/gotgbot/compare/v2.0.0-rc.27...v2.0.0-rc.30) --- updated-dependencies: - dependency-name: github.com/PaulSonOfLars/gotgbot/v2 dependency-type: direct:production update-type: version-update:semver-patch ... Signed-off-by: dependabot[bot] <support@github.com>
322 lines
10 KiB
Go
322 lines
10 KiB
Go
package gotgbot
|
|
|
|
import (
|
|
"html"
|
|
"strconv"
|
|
"strings"
|
|
"unicode"
|
|
"unicode/utf16"
|
|
)
|
|
|
|
var mdMap = map[string]string{
|
|
"bold": "*",
|
|
"italic": "_",
|
|
"code": "`",
|
|
}
|
|
|
|
var mdV2Map = map[string]string{
|
|
"bold": "*",
|
|
"italic": "_",
|
|
"code": "`",
|
|
"pre": "```",
|
|
"underline": "__",
|
|
"strikethrough": "~",
|
|
"spoiler": "||",
|
|
"blockquote": ">",
|
|
"expandable_blockquote": "**>",
|
|
}
|
|
|
|
var htmlMap = map[string]string{
|
|
"bold": "b",
|
|
"italic": "i",
|
|
"code": "code",
|
|
"pre": "pre",
|
|
"underline": "u",
|
|
"strikethrough": "s",
|
|
"spoiler": "span class=\"tg-spoiler\"",
|
|
"blockquote": "blockquote",
|
|
"expandable_blockquote": "blockquote expandable",
|
|
}
|
|
|
|
// OriginalMD gets the original markdown formatting of a message text.
|
|
func (m Message) OriginalMD() string {
|
|
return getOrigMsgMD(utf16.Encode([]rune(m.Text)), m.Entities)
|
|
}
|
|
|
|
// OriginalMDV2 gets the original markdownV2 formatting of a message text.
|
|
func (m Message) OriginalMDV2() string {
|
|
return getOrigMsgMDV2(utf16.Encode([]rune(m.Text)), m.Entities)
|
|
}
|
|
|
|
// OriginalHTML gets the original HTML formatting of a message text.
|
|
func (m Message) OriginalHTML() string {
|
|
return getOrigMsgHTML(utf16.Encode([]rune(m.Text)), m.Entities)
|
|
}
|
|
|
|
// OriginalCaptionMD gets the original markdown formatting of a message caption.
|
|
func (m Message) OriginalCaptionMD() string {
|
|
return getOrigMsgMD(utf16.Encode([]rune(m.Caption)), m.CaptionEntities)
|
|
}
|
|
|
|
// OriginalCaptionMDV2 gets the original markdownV2 formatting of a message caption.
|
|
func (m Message) OriginalCaptionMDV2() string {
|
|
return getOrigMsgMDV2(utf16.Encode([]rune(m.Caption)), m.CaptionEntities)
|
|
}
|
|
|
|
// OriginalCaptionHTML gets the original HTML formatting of a message caption.
|
|
func (m Message) OriginalCaptionHTML() string {
|
|
return getOrigMsgHTML(utf16.Encode([]rune(m.Caption)), m.CaptionEntities)
|
|
}
|
|
|
|
// Does not support nesting. only look at upper entities.
|
|
func getOrigMsgMD(utf16Data []uint16, ents []MessageEntity) string {
|
|
out := strings.Builder{}
|
|
prev := int64(0)
|
|
for _, ent := range getUpperEntities(ents) {
|
|
newPrev := ent.Offset + ent.Length
|
|
prevText := string(utf16.Decode(utf16Data[prev:ent.Offset]))
|
|
|
|
text := utf16.Decode(utf16Data[ent.Offset:newPrev])
|
|
pre, cleanCntnt, post := splitEdgeWhitespace(string(text), ent)
|
|
cleanCntntRune := []rune(cleanCntnt)
|
|
|
|
switch ent.Type {
|
|
case "bold", "italic", "code":
|
|
out.WriteString(prevText + pre + mdMap[ent.Type] + escapeContainedMDV1(cleanCntntRune, []rune(mdMap[ent.Type])) + mdMap[ent.Type] + post)
|
|
case "pre":
|
|
if ent.Language == "" {
|
|
out.WriteString(prevText + pre + mdMap[ent.Type] + escapeContainedMDV1(cleanCntntRune, []rune(mdMap[ent.Type])) + mdMap[ent.Type] + post)
|
|
} else {
|
|
out.WriteString(prevText + pre + mdMap[ent.Type] + ent.Language + "\n" + escapeContainedMDV1(cleanCntntRune, []rune(mdMap[ent.Type])) + mdMap[ent.Type] + post)
|
|
}
|
|
case "text_mention":
|
|
out.WriteString(prevText + pre + "[" + escapeContainedMDV1(cleanCntntRune, []rune("[]()")) + "](tg://user?id=" + strconv.FormatInt(ent.User.Id, 10) + ")" + post)
|
|
case "text_link":
|
|
out.WriteString(prevText + pre + "[" + escapeContainedMDV1(cleanCntntRune, []rune("[]()")) + "](" + ent.Url + ")" + post)
|
|
default:
|
|
continue
|
|
}
|
|
prev = newPrev
|
|
}
|
|
|
|
out.WriteString(string(utf16.Decode(utf16Data[prev:])))
|
|
return out.String()
|
|
}
|
|
|
|
func getOrigMsgHTML(utf16Data []uint16, ents []MessageEntity) string {
|
|
if len(ents) == 0 {
|
|
return html.EscapeString(string(utf16.Decode(utf16Data)))
|
|
}
|
|
|
|
bd := strings.Builder{}
|
|
prev := int64(0)
|
|
for _, e := range getUpperEntities(ents) {
|
|
data, end := fillNestedHTML(utf16Data, e, prev, getChildEntities(e, ents))
|
|
bd.WriteString(data)
|
|
prev = end
|
|
}
|
|
|
|
bd.WriteString(html.EscapeString(string(utf16.Decode(utf16Data[prev:]))))
|
|
return bd.String()
|
|
}
|
|
|
|
func getOrigMsgMDV2(utf16Data []uint16, ents []MessageEntity) string {
|
|
if len(ents) == 0 {
|
|
return string(utf16.Decode(utf16Data))
|
|
}
|
|
|
|
bd := strings.Builder{}
|
|
prev := int64(0)
|
|
for _, e := range getUpperEntities(ents) {
|
|
data, end := fillNestedMarkdownV2(utf16Data, e, prev, getChildEntities(e, ents))
|
|
bd.WriteString(data)
|
|
prev = end
|
|
}
|
|
|
|
bd.WriteString(string(utf16.Decode(utf16Data[prev:])))
|
|
return bd.String()
|
|
}
|
|
|
|
func fillNestedHTML(data []uint16, ent MessageEntity, start int64, entities []MessageEntity) (string, int64) {
|
|
entEnd := ent.Offset + ent.Length
|
|
if len(entities) == 0 || entEnd < entities[0].Offset {
|
|
// no nesting; just return straight away and move to next.
|
|
return writeFinalHTML(data, ent, start, html.EscapeString(string(utf16.Decode(data[ent.Offset:entEnd])))), entEnd
|
|
}
|
|
subPrev := ent.Offset
|
|
subEnd := ent.Offset
|
|
bd := strings.Builder{}
|
|
for _, e := range getUpperEntities(entities) {
|
|
if e.Offset < subEnd || e == ent {
|
|
continue
|
|
}
|
|
if e.Offset >= entEnd {
|
|
break
|
|
}
|
|
|
|
out, end := fillNestedHTML(data, e, subPrev, getChildEntities(e, entities))
|
|
bd.WriteString(out)
|
|
subPrev = end
|
|
}
|
|
|
|
bd.WriteString(html.EscapeString(string(utf16.Decode(data[subPrev:entEnd]))))
|
|
|
|
return writeFinalHTML(data, ent, start, bd.String()), entEnd
|
|
}
|
|
|
|
func fillNestedMarkdownV2(data []uint16, ent MessageEntity, start int64, entities []MessageEntity) (string, int64) {
|
|
entEnd := ent.Offset + ent.Length
|
|
if len(entities) == 0 || entEnd < entities[0].Offset {
|
|
// no nesting; just return straight away and move to next.
|
|
return writeFinalMarkdownV2(data, ent, start, string(utf16.Decode(data[ent.Offset:entEnd]))), entEnd
|
|
}
|
|
subPrev := ent.Offset
|
|
subEnd := ent.Offset
|
|
bd := strings.Builder{}
|
|
for _, e := range getUpperEntities(entities) {
|
|
if e.Offset < subEnd || e == ent {
|
|
continue
|
|
}
|
|
if e.Offset >= entEnd {
|
|
break
|
|
}
|
|
|
|
out, end := fillNestedMarkdownV2(data, e, subPrev, getChildEntities(e, entities))
|
|
bd.WriteString(out)
|
|
subPrev = end
|
|
}
|
|
|
|
bd.WriteString(string(utf16.Decode(data[subPrev:entEnd])))
|
|
|
|
return writeFinalMarkdownV2(data, ent, start, bd.String()), entEnd
|
|
}
|
|
|
|
func writeFinalHTML(data []uint16, ent MessageEntity, start int64, cntnt string) string {
|
|
prevText := html.EscapeString(string(utf16.Decode(data[start:ent.Offset])))
|
|
switch ent.Type {
|
|
case "bold", "italic", "code", "underline", "strikethrough", "spoiler":
|
|
return prevText + "<" + htmlMap[ent.Type] + ">" + cntnt + "</" + closeHTMLTag(htmlMap[ent.Type]) + ">"
|
|
case "pre":
|
|
// <pre>text</pre>
|
|
if ent.Language == "" {
|
|
return prevText + "<pre>" + cntnt + "</pre>"
|
|
}
|
|
// <pre><code class="lang">text</code></pre>
|
|
return prevText + `<pre><code class="` + ent.Language + `">` + cntnt + "</code></pre>"
|
|
case "custom_emoji":
|
|
return prevText + `<tg-emoji emoji-id="` + ent.CustomEmojiId + `">` + cntnt + "</tg-emoji>"
|
|
case "text_mention":
|
|
return prevText + `<a href="tg://user?id=` + strconv.FormatInt(ent.User.Id, 10) + `">` + cntnt + "</a>"
|
|
case "text_link":
|
|
return prevText + `<a href="` + ent.Url + `">` + cntnt + "</a>"
|
|
case "blockquote":
|
|
return prevText + `<blockquote>` + cntnt + "</blockquote>"
|
|
case "expandable_blockquote":
|
|
return prevText + `<blockquote expandable>` + cntnt + "</blockquote>"
|
|
default:
|
|
return prevText + cntnt
|
|
}
|
|
}
|
|
|
|
// closeHTMLTag makes sure to generate the correct HTML closing tag for a given opening tag.
|
|
func closeHTMLTag(s string) string {
|
|
if !strings.HasPrefix(s, "span") {
|
|
return s
|
|
}
|
|
return "span"
|
|
}
|
|
|
|
func writeFinalMarkdownV2(data []uint16, ent MessageEntity, start int64, cntnt string) string {
|
|
prevText := string(utf16.Decode(data[start:ent.Offset]))
|
|
pre, cleanCntnt, post := splitEdgeWhitespace(cntnt, ent)
|
|
switch ent.Type {
|
|
case "bold", "italic", "code", "underline", "strikethrough", "spoiler":
|
|
return prevText + pre + mdV2Map[ent.Type] + cleanCntnt + mdV2Map[ent.Type] + post
|
|
case "pre":
|
|
if ent.Language == "" {
|
|
return prevText + pre + "```\n" + cleanCntnt + "```" + post
|
|
}
|
|
return prevText + pre + "```" + ent.Language + "\n" + cleanCntnt + "```" + post
|
|
case "custom_emoji":
|
|
// Yes, custom emoji have a weird little ! at the front
|
|
// https://core.telegram.org/bots/api#markdownv2-style
|
|
return prevText + pre + "![" + cleanCntnt + "](tg://emoji?id=" + ent.CustomEmojiId + ")" + post
|
|
case "text_mention":
|
|
return prevText + pre + "[" + cleanCntnt + "](tg://user?id=" + strconv.FormatInt(ent.User.Id, 10) + ")" + post
|
|
case "text_link":
|
|
return prevText + pre + "[" + cleanCntnt + "](" + ent.Url + ")" + post
|
|
case "blockquote":
|
|
return prevText + pre + ">" + strings.Join(strings.Split(cleanCntnt, "\n"), "\n>") + post
|
|
case "expandable_blockquote":
|
|
return prevText + pre + "**>" + strings.Join(strings.Split(cleanCntnt, "\n"), "\n>") + "||" + post
|
|
default:
|
|
return prevText + cntnt
|
|
}
|
|
}
|
|
|
|
func getUpperEntities(ents []MessageEntity) []MessageEntity {
|
|
prev := int64(0)
|
|
uppers := make([]MessageEntity, 0, len(ents))
|
|
for _, e := range ents {
|
|
if e.Offset < prev {
|
|
continue
|
|
}
|
|
uppers = append(uppers, e)
|
|
prev = e.Offset + e.Length
|
|
}
|
|
return uppers
|
|
}
|
|
|
|
func getChildEntities(ent MessageEntity, ents []MessageEntity) []MessageEntity {
|
|
end := ent.Offset + ent.Length
|
|
children := make([]MessageEntity, 0, len(ents))
|
|
for _, e := range ents {
|
|
if e.Offset < ent.Offset || e == ent {
|
|
continue
|
|
}
|
|
if e.Offset >= end {
|
|
break
|
|
}
|
|
children = append(children, e)
|
|
}
|
|
return children
|
|
}
|
|
|
|
func splitEdgeWhitespace(text string, ent MessageEntity) (pre string, cntnt string, post string) {
|
|
keepNewLines := ent.Type == "pre"
|
|
|
|
bd := strings.Builder{}
|
|
rText := []rune(text)
|
|
for i := 0; i < len(rText) && unicode.IsSpace(rText[i]) && (!keepNewLines || rText[i] != '\n'); i++ {
|
|
bd.WriteRune(rText[i])
|
|
}
|
|
pre = bd.String()
|
|
|
|
text = strings.TrimPrefix(text, pre)
|
|
bd.Reset()
|
|
for i := len(rText) - 1; i >= 0 && unicode.IsSpace(rText[i]); i-- {
|
|
bd.WriteRune(rText[i])
|
|
}
|
|
post = bd.String()
|
|
return pre, strings.TrimSuffix(text, post), post
|
|
}
|
|
|
|
func escapeContainedMDV1(data []rune, mdType []rune) string {
|
|
out := strings.Builder{}
|
|
for _, x := range data {
|
|
if contains(x, mdType) {
|
|
out.WriteRune('\\')
|
|
}
|
|
out.WriteRune(x)
|
|
}
|
|
return out.String()
|
|
}
|
|
|
|
func contains(r rune, rs []rune) bool {
|
|
for _, rr := range rs {
|
|
if r == rr {
|
|
return true
|
|
}
|
|
}
|
|
return false
|
|
}
|