forked from fair/matrix-puppeteer-line
First crack at backfilling
This commit is contained in:
parent
ec081e94df
commit
0260ad89f4
|
@ -200,6 +200,7 @@ class Portal(DBPortal, BasePortal):
|
||||||
return ReuploadedMediaInfo(mxc, decryption_info, mime_type, file_name, len(data))
|
return ReuploadedMediaInfo(mxc, decryption_info, mime_type, file_name, len(data))
|
||||||
|
|
||||||
async def update_info(self, conv: ChatInfo) -> None:
|
async def update_info(self, conv: ChatInfo) -> None:
|
||||||
|
# TODO Not true: a single-participant chat could be a group!
|
||||||
if len(conv.participants) == 1:
|
if len(conv.participants) == 1:
|
||||||
self.other_user = conv.participants[0].id
|
self.other_user = conv.participants[0].id
|
||||||
if self._main_intent is self.az.intent:
|
if self._main_intent is self.az.intent:
|
||||||
|
@ -251,8 +252,7 @@ class Portal(DBPortal, BasePortal):
|
||||||
|
|
||||||
async def backfill(self, source: 'u.User') -> None:
|
async def backfill(self, source: 'u.User') -> None:
|
||||||
with self.backfill_lock:
|
with self.backfill_lock:
|
||||||
self.log.debug("Backfill: TODO!")
|
await self._backfill(source)
|
||||||
#await self._backfill(source)
|
|
||||||
|
|
||||||
async def _backfill(self, source: 'u.User') -> None:
|
async def _backfill(self, source: 'u.User') -> None:
|
||||||
self.log.debug("Backfilling history through %s", source.mxid)
|
self.log.debug("Backfilling history through %s", source.mxid)
|
||||||
|
|
|
@ -118,6 +118,7 @@ class Puppet(DBPuppet, BasePuppet):
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
async def get_by_custom_mxid(cls, mxid: UserID) -> Optional['u.User']:
|
async def get_by_custom_mxid(cls, mxid: UserID) -> Optional['u.User']:
|
||||||
if mxid == cls.config["bridge.user"]:
|
# TODO double-puppeting
|
||||||
return await cls.bridge.get_user(mxid)
|
#if mxid == cls.config["bridge.user"]:
|
||||||
|
# return await cls.bridge.get_user(mxid)
|
||||||
return None
|
return None
|
||||||
|
|
|
@ -55,6 +55,7 @@ class User(DBUser, BaseUser):
|
||||||
self._metric_value = defaultdict(lambda: False)
|
self._metric_value = defaultdict(lambda: False)
|
||||||
self._connection_check_task = None
|
self._connection_check_task = None
|
||||||
self.client = None
|
self.client = None
|
||||||
|
self.intent = None
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
def init_cls(cls, bridge: 'MessagesBridge') -> None:
|
def init_cls(cls, bridge: 'MessagesBridge') -> None:
|
||||||
|
@ -83,7 +84,7 @@ class User(DBUser, BaseUser):
|
||||||
self.log.warning("Failed to log in with shared secret")
|
self.log.warning("Failed to log in with shared secret")
|
||||||
return
|
return
|
||||||
self.log.debug("Logged in with shared secret")
|
self.log.debug("Logged in with shared secret")
|
||||||
#self.intent = self.az.intent.user(self.mxid, access_token)
|
self.intent = self.az.intent.user(self.mxid, access_token)
|
||||||
except Exception:
|
except Exception:
|
||||||
self.log.exception("Error logging in with shared secret")
|
self.log.exception("Error logging in with shared secret")
|
||||||
|
|
||||||
|
|
|
@ -73,10 +73,7 @@ class MautrixController {
|
||||||
*/
|
*/
|
||||||
async _tryParseDate(text, ref, option) {
|
async _tryParseDate(text, ref, option) {
|
||||||
const parsed = await window.__chronoParseDate(text, ref, option)
|
const parsed = await window.__chronoParseDate(text, ref, option)
|
||||||
if (parsed) {
|
return parsed ? new Date(parsed) : null
|
||||||
return new Date(parsed)
|
|
||||||
}
|
|
||||||
return null
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -86,14 +83,11 @@ class MautrixController {
|
||||||
* @return {?Date} - The value in the date separator.
|
* @return {?Date} - The value in the date separator.
|
||||||
* @private
|
* @private
|
||||||
*/
|
*/
|
||||||
async _parseDate(text) {
|
async _tryParseDayDate(text) {
|
||||||
if (!text) {
|
if (!text) {
|
||||||
return null
|
return null
|
||||||
}
|
}
|
||||||
text = text
|
text = text.replace(/\. /, "/")
|
||||||
.replace(/[^\w\d\s,:.-]/g, "")
|
|
||||||
.replace(/\s{2,}/g, " ")
|
|
||||||
.trim()
|
|
||||||
const now = new Date()
|
const now = new Date()
|
||||||
let newDate = await this._tryParseDate(text)
|
let newDate = await this._tryParseDate(text)
|
||||||
if (!newDate || newDate > now) {
|
if (!newDate || newDate > now) {
|
||||||
|
@ -101,7 +95,7 @@ class MautrixController {
|
||||||
lastWeek.setDate(lastWeek.getDate() - 7)
|
lastWeek.setDate(lastWeek.getDate() - 7)
|
||||||
newDate = await this._tryParseDate(text, lastWeek, { forwardDate: true })
|
newDate = await this._tryParseDate(text, lastWeek, { forwardDate: true })
|
||||||
}
|
}
|
||||||
return newDate <= now ? newDate : null
|
return newDate && newDate <= now ? newDate : null
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -122,14 +116,18 @@ class MautrixController {
|
||||||
* @return {MessageData}
|
* @return {MessageData}
|
||||||
* @private
|
* @private
|
||||||
*/
|
*/
|
||||||
_parseMessage(date, element) {
|
_tryParseMessage(date, element) {
|
||||||
const messageData = {
|
const messageData = {
|
||||||
id: +element.getAttribute("msg-id"),
|
id: +element.getAttribute("data-local-id"),
|
||||||
timestamp: date ? date.getTime() : null,
|
timestamp: date ? date.getTime() : null,
|
||||||
is_outgoing: element.getAttribute("is-outgoing") === "true",
|
is_outgoing: element.classList.contains("mdRGT07Own"),
|
||||||
}
|
}
|
||||||
messageData.text = element.querySelector("mws-text-message-part .text-msg")?.innerText
|
const messageElement = element.querySelector(".mdRGT07Body > .mdRGT07Msg")
|
||||||
if (element.querySelector("mws-image-message-part .image-msg")) {
|
if (messageElement.classList.contains("mdRGT07Text")) {
|
||||||
|
// TODO Use "Inner" or not?
|
||||||
|
messageData.text = messageElement.querySelector(".mdRGT07MsgTextInner")?.innerText
|
||||||
|
} else if (messageElement.classList.contains("mdRGT07Image")) {
|
||||||
|
// TODO Doesn't this need to be a URL?
|
||||||
messageData.image = true
|
messageData.image = true
|
||||||
}
|
}
|
||||||
return messageData
|
return messageData
|
||||||
|
@ -148,7 +146,7 @@ class MautrixController {
|
||||||
if (addedNode.classList.contains("mdRGT07Own")) {
|
if (addedNode.classList.contains("mdRGT07Own")) {
|
||||||
const timeElement = addedNode.querySelector("time.MdNonDisp")
|
const timeElement = addedNode.querySelector("time.MdNonDisp")
|
||||||
if (timeElement) {
|
if (timeElement) {
|
||||||
msgID = addedNode.getAttribute("data-local-id")
|
msgID = +addedNode.getAttribute("data-local-id")
|
||||||
observer.disconnect()
|
observer.disconnect()
|
||||||
observer = new MutationObserver(visibleTimeCallback)
|
observer = new MutationObserver(visibleTimeCallback)
|
||||||
observer.observe(timeElement, { attributes: true, attributeFilter: ["class"] })
|
observer.observe(timeElement, { attributes: true, attributeFilter: ["class"] })
|
||||||
|
@ -184,27 +182,29 @@ class MautrixController {
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Parse a message list in the given element. The element should probably be the .content div
|
* Parse the message list of whatever the currently-viewed chat is.
|
||||||
* inside a mws-message-list element.
|
|
||||||
*
|
*
|
||||||
* @param {Element} element - The message list element.
|
|
||||||
* @return {[MessageData]} - A list of messages.
|
* @return {[MessageData]} - A list of messages.
|
||||||
*/
|
*/
|
||||||
async parseMessageList(element) {
|
async parseMessageList() {
|
||||||
|
const msgList = document.querySelector("#_chat_room_msg_list")
|
||||||
const messages = []
|
const messages = []
|
||||||
let messageDate = null
|
let refDate = null
|
||||||
for (const child of element.children) {
|
for (const child of msgList.children) {
|
||||||
switch (child.tagName.toLowerCase()) {
|
if (child.tagName == "DIV") {
|
||||||
case "mws-message-wrapper":
|
if (child.classList.contains("mdRGT10Date")) {
|
||||||
if (!child.getAttribute("msg-id").startsWith("tmp_")) {
|
refDate = await this._tryParseDayDate(child.firstElementChild.innerText)
|
||||||
messages.push(this._parseMessage(messageDate, child))
|
}
|
||||||
|
else if (child.classList.contains("MdRGT07Cont")) {
|
||||||
|
// TODO :not(.MdNonDisp) to exclude not-yet-posted messages,
|
||||||
|
// but that is unlikely to be a problem here.
|
||||||
|
// Also, offscreen times may have .MdNonDisp on them
|
||||||
|
const timeElement = child.querySelector("time")
|
||||||
|
if (timeElement) {
|
||||||
|
const messageDate = await this._tryParseDate(timeElement.innerText, refDate)
|
||||||
|
messages.push(this._tryParseMessage(messageDate, child))
|
||||||
|
}
|
||||||
}
|
}
|
||||||
break
|
|
||||||
case "mws-tombstone-message-wrapper":
|
|
||||||
messageDate = await this._parseDate(
|
|
||||||
child.querySelector("mws-relative-timestamp")?.innerText,
|
|
||||||
) || messageDate
|
|
||||||
break
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
return messages
|
return messages
|
||||||
|
|
|
@ -98,8 +98,8 @@ export default class MessagesPuppeteer {
|
||||||
/* TODO
|
/* TODO
|
||||||
await this.page.exposeFunction("__mautrixReceiveChanges",
|
await this.page.exposeFunction("__mautrixReceiveChanges",
|
||||||
this._receiveChatListChanges.bind(this))
|
this._receiveChatListChanges.bind(this))
|
||||||
await this.page.exposeFunction("__chronoParseDate", chrono.parseDate)
|
|
||||||
*/
|
*/
|
||||||
|
await this.page.exposeFunction("__chronoParseDate", chrono.parseDate)
|
||||||
|
|
||||||
// NOTE Must *always* re-login on a browser session, so no need to check if already logged in
|
// NOTE Must *always* re-login on a browser session, so no need to check if already logged in
|
||||||
this.loginRunning = false
|
this.loginRunning = false
|
||||||
|
@ -504,14 +504,13 @@ export default class MessagesPuppeteer {
|
||||||
// Probably use a MutationObserver mapped to msgID
|
// Probably use a MutationObserver mapped to msgID
|
||||||
|
|
||||||
async _getMessagesUnsafe(id, minID = 0) {
|
async _getMessagesUnsafe(id, minID = 0) {
|
||||||
/* TODO Also handle "decrypting" state
|
// TODO Also handle "decrypting" state
|
||||||
|
// TODO Handle unloaded messages. Maybe scroll up
|
||||||
await this._switchChatUnsafe(id)
|
await this._switchChatUnsafe(id)
|
||||||
this.log("Waiting for messages to load")
|
this.log("Waiting for messages to load")
|
||||||
await this.page.waitFor("mws-message-wrapper")
|
const messages = await this.page.evaluate(
|
||||||
const messages = await this.page.$eval("mws-messages-list .content",
|
() => window.__mautrixController.parseMessageList())
|
||||||
element => window.__mautrixController.parseMessageList(element))
|
|
||||||
return messages.filter(msg => msg.id > minID && !this.sentMessageIDs.has(msg.id))
|
return messages.filter(msg => msg.id > minID && !this.sentMessageIDs.has(msg.id))
|
||||||
*/
|
|
||||||
}
|
}
|
||||||
|
|
||||||
async _processChatListChangeUnsafe(id) {
|
async _processChatListChangeUnsafe(id) {
|
||||||
|
|
Loading…
Reference in New Issue