# matrix-appservice-kakaotalk - A Matrix-KakaoTalk puppeting bridge. # Copyright (C) 2022 Tulir Asokan, Andrew Ferrazzutti # # This program is free software: you can redistribute it and/or modify # it under the terms of the GNU Affero General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU Affero General Public License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . from __future__ import annotations from typing import Match import re from mautrix.types import Format, MessageType, TextMessageEventContent from ..kt.types.chat.attachment.mention import MentionStruct from .. import puppet as pu, user as u _START = r"^|\s" _END = r"$|\s" _TEXT_NO_SURROUNDING_SPACE = r"(?:[^\s].*?[^\s])|[^\s]" COMMON_REGEX = re.compile(rf"({_START})([_~*])({_TEXT_NO_SURROUNDING_SPACE})\2({_END})") INLINE_CODE_REGEX = re.compile(rf"({_START})(`)(.+?)`({_END})") MENTION_REGEX = re.compile(r"@(\d+)\u2063(.+?)\u2063") tags = {"_": "em", "*": "strong", "~": "del", "`": "code"} def _handle_match(html: str, match: Match, nested: bool) -> tuple[str, int]: start, end = match.start(), match.end() prefix, sigil, text, suffix = match.groups() if nested: text = _convert_formatting(text) tag = tags[sigil] # We don't want to include the whitespace suffix length, as that could be used as the # whitespace prefix right after this formatting block. pos = start + len(prefix) + (2 * len(tag) + 5) + len(text) html = f"{html[:start]}{prefix}<{tag}>{text}{suffix}{html[end:]}" return html, pos def _convert_formatting(html: str) -> str: pos = 0 while pos < len(html): i_match = INLINE_CODE_REGEX.search(html, pos) c_match = COMMON_REGEX.search(html, pos) if i_match and c_match: match = min(i_match, c_match, key=lambda match: match.start()) else: match = i_match or c_match if match: html, pos = _handle_match(html, match, nested=match != i_match) else: break return html def _handle_blockquote(output: list[str], blockquote: bool, line: str) -> tuple[bool, str]: if not blockquote and line.startswith("> "): line = line[len("> ") :] output.append("
") blockquote = True elif blockquote: if line.startswith(">"): line = line[len(">") :] if line.startswith(" "): line = line[1:] else: output.append("
") blockquote = False return blockquote, line async def kakaotalk_to_matrix(msg: str | None, mentions: list[MentionStruct] | None) -> TextMessageEventContent: # TODO Shouts text = msg or "" content = TextMessageEventContent(msgtype=MessageType.TEXT, body=text) if mentions: mention_user_ids = [] at_chunks = text.split("@") for m in mentions: for idx in m.at: chunk = at_chunks[idx] original = chunk[:m.len] mention_user_ids.append(int(m.user_id)) at_chunks[idx] = f"{m.user_id}\u2063{original}\u2063{chunk[m.len:]}" text = "@".join(at_chunks) mention_user_map = {} for ktid in mention_user_ids: user = await u.User.get_by_ktid(ktid) if user: mention_user_map[ktid] = user.mxid else: puppet = await pu.Puppet.get_by_ktid(ktid, create=False) mention_user_map[ktid] = puppet.mxid if puppet else None if mention_user_map: def _mention_replacer(match: Match) -> str: mxid = mention_user_map[int(match.group(1))] if not mxid: return match.group(2) return f'{match.group(2)}' content.format = Format.HTML content.formatted_body = MENTION_REGEX.sub(_mention_replacer, text).replace("\n", "
\n") return content