2018-07-09 00:21:24 +02:00
|
|
|
# This file is part of Gajim.
|
|
|
|
#
|
|
|
|
# Gajim is free software; you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License as published
|
|
|
|
# by the Free Software Foundation; version 3 only.
|
|
|
|
#
|
|
|
|
# Gajim is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with Gajim. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
# XEP-0313: Message Archive Management
|
|
|
|
|
2018-09-15 20:45:38 +02:00
|
|
|
import time
|
2018-07-09 00:21:24 +02:00
|
|
|
from datetime import datetime, timedelta
|
|
|
|
|
|
|
|
import nbxmpp
|
2019-01-04 00:03:35 +01:00
|
|
|
from nbxmpp.structs import StanzaHandler
|
2018-07-09 00:21:24 +02:00
|
|
|
|
|
|
|
from gajim.common import app
|
2018-12-18 22:41:06 +01:00
|
|
|
from gajim.common.nec import NetworkEvent
|
2018-07-09 00:21:24 +02:00
|
|
|
from gajim.common.nec import NetworkIncomingEvent
|
2018-09-15 20:45:38 +02:00
|
|
|
from gajim.common.const import ArchiveState
|
|
|
|
from gajim.common.const import KindConstant
|
|
|
|
from gajim.common.const import SyncThreshold
|
2018-07-09 00:21:24 +02:00
|
|
|
from gajim.common.caps_cache import muc_caps_cache
|
2018-09-15 20:45:38 +02:00
|
|
|
from gajim.common.helpers import get_sync_threshold
|
2018-11-30 23:05:15 +01:00
|
|
|
from gajim.common.helpers import AdditionalDataDict
|
2018-07-09 00:21:24 +02:00
|
|
|
from gajim.common.modules.misc import parse_oob
|
|
|
|
from gajim.common.modules.misc import parse_correction
|
2019-02-19 19:17:56 +01:00
|
|
|
from gajim.common.modules.util import get_eme_message
|
2019-03-09 23:16:27 +01:00
|
|
|
from gajim.common.modules.base import BaseModule
|
2018-07-09 00:21:24 +02:00
|
|
|
|
|
|
|
|
2019-03-09 23:16:27 +01:00
|
|
|
class MAM(BaseModule):
    """Connection module for XEP-0313 (Message Archive Management).

    Builds archive queries, tracks the query id that is currently
    outstanding per archive JID, validates and stores the archived
    messages that come back, and reads/writes the archiving preferences.
    """

    # Layout of the 'start' / 'end' values placed into a query form
    _DATE_FORMAT = '%Y-%m-%dT%H:%M:%SZ'

    def __init__(self, con):
        BaseModule.__init__(self, con)

        self.handlers = [
            StanzaHandler(name='message',
                          callback=self._mam_message_received,
                          priority=51),
        ]

        # Set by pass_disco() once a supported MAM namespace was found
        self.available = False
        self.archiving_namespace = None

        # Maps archive jid (str) -> id of the query currently running
        self._mam_query_ids = {}

        # Holds archive jids where catch up was successful
        self._catch_up_finished = []

    def pass_disco(self, from_, _identities, features, _data, _node):
        """Pick the MAM namespace out of a disco feature list.

        mam:2 is preferred over mam:1. If neither is present nothing
        happens; otherwise the module is marked available and a
        'feature-discovered' event is pushed.
        """
        for namespace in (nbxmpp.NS_MAM_2, nbxmpp.NS_MAM_1):
            if namespace in features:
                self.archiving_namespace = namespace
                break
        else:
            return

        self.available = True
        self._log.info('Discovered MAM %s: %s',
                       self.archiving_namespace, from_)

        app.nec.push_incoming_event(
            NetworkEvent('feature-discovered',
                         account=self._account,
                         feature=self.archiving_namespace))

    def _from_valid_archive(self, _stanza, properties):
        """Return whether the message comes from the archive we expect.

        For groupchat messages the expected archive is the JID in
        properties.jid, otherwise it is our own JID (bare comparison).
        """
        if properties.type.is_groupchat:
            expected_archive = properties.jid
        else:
            expected_archive = self._con.get_own_jid()

        return properties.mam.archive.bareMatch(expected_archive)

    def _get_unique_id(self, properties):
        """Return the (stanza_id, message_id) pair used for deduplication.

        Either element may be None, depending on the message type.
        """
        mam_id = properties.mam.id

        if properties.type.is_groupchat:
            return mam_id, None

        if properties.is_self_message:
            return None, properties.id

        if properties.is_muc_pm:
            return mam_id, properties.id

        if self._con.get_own_jid().bareMatch(properties.jid):
            # message we sent
            return mam_id, properties.id

        # A message we received
        return mam_id, None

    def _mam_message_received(self, _con, stanza, properties):
        """Handle an incoming message stanza that carries a MAM result.

        Non-MAM messages are ignored (plain return). Every MAM message
        ends with nbxmpp.NodeProcessed being raised, whether it was
        rejected, found to be a duplicate, or handed on for storage.
        """
        if not properties.is_mam_message:
            return

        # Pushed before any validation takes place
        app.nec.push_incoming_event(
            NetworkIncomingEvent('raw-mam-message-received',
                                 conn=self._con,
                                 stanza=stanza))

        if not self._from_valid_archive(stanza, properties):
            self._log.warning('Message from invalid archive %s',
                              properties.mam.archive)
            raise nbxmpp.NodeProcessed

        self._log.info('Received message from archive: %s',
                       properties.mam.archive)
        if not self._is_valid_request(properties):
            self._log.warning('Invalid MAM Message: unknown query id %s',
                              properties.mam.query_id)
            self._log.debug(stanza)
            raise nbxmpp.NodeProcessed

        groupchat = properties.type.is_groupchat

        event_attrs = {}
        if groupchat:
            event_attrs.update(self._parse_gc_attrs(properties))
        else:
            event_attrs.update(self._parse_chat_attrs(stanza, properties))

        stanza_id, message_id = self._get_unique_id(properties)

        if properties.mam.is_ver_2:
            # Search only with stanza-id for duplicates on mam:2
            if app.logger.find_stanza_id(self._account,
                                         str(properties.mam.archive),
                                         stanza_id,
                                         message_id,
                                         groupchat=groupchat):
                self._log.info('Found duplicate with stanza-id: %s, '
                               'message-id: %s', stanza_id, message_id)
                raise nbxmpp.NodeProcessed

        additional_data = AdditionalDataDict()
        if properties.has_user_delay:
            # Record it as a user timestamp
            additional_data.set_value(
                'gajim', 'user_timestamp', properties.user_timestamp)

        event_attrs.update(
            {'conn': self._con,
             'additional_data': additional_data,
             'encrypted': False,
             'timestamp': properties.mam.timestamp,
             'self_message': properties.is_self_message,
             'groupchat': groupchat,
             'muc_pm': properties.is_muc_pm,
             'stanza_id': stanza_id,
             'origin_id': message_id,
             'message_id': properties.id,
             'correct_id': None,
             'archive_jid': properties.mam.archive,
             'msgtxt': properties.body,
             'message': stanza,
             'stanza': stanza,
             'namespace': properties.mam.namespace,
             })

        if groupchat:
            event = MamGcMessageReceivedEvent(None, **event_attrs)
        else:
            event = MamMessageReceivedEvent(None, **event_attrs)

        if properties.is_encrypted:
            event.additional_data['encrypted'] = (
                properties.encrypted.additional_data)
            self._decryption_finished(event)
        else:
            # Give plugins the chance to decrypt; they receive
            # _decryption_finished as the callback to continue with.
            app.plugin_manager.extension_point(
                'decrypt', self._con, event, self._decryption_finished)
            if not event.encrypted:
                if properties.eme is not None:
                    event.msgtxt = get_eme_message(properties.eme)
                self._decryption_finished(event)

        raise nbxmpp.NodeProcessed

    @staticmethod
    def _parse_gc_attrs(properties):
        """Return the event attributes specific to a groupchat message."""
        real_jid = None
        if properties.muc_user is not None:
            real_jid = properties.muc_user.jid
        return {'with_': properties.jid,
                'nick': properties.muc_nickname,
                'real_jid': real_jid,
                'kind': KindConstant.GC_MSG}

    def _parse_chat_attrs(self, stanza, properties):
        """Return the event attributes specific to a one-to-one message.

        The conversation partner ('with_') is the recipient when the
        message was sent by us, otherwise the sender.
        """
        frm = properties.jid
        to = stanza.getTo()
        if frm.bareMatch(self._con.get_own_jid()):
            with_ = to
            kind = KindConstant.CHAT_MSG_SENT
        else:
            with_ = frm
            kind = KindConstant.CHAT_MSG_RECV

        return {'with_': with_,
                'nick': None,
                'kind': kind}

    def _decryption_finished(self, event):
        """Store a (decrypted) archived message and announce it.

        Messages without text are dropped, as are self messages without
        an origin-id and, for mam:1, messages that the fallback duplicate
        search already finds in the logs.
        """
        if not event.msgtxt:
            # For example Chatstates, Receipts, Chatmarkers
            self._log.debug(event.message.getProperties())
            return

        event.correct_id = parse_correction(event.message)
        parse_oob(event)

        if event.muc_pm:
            # we store the message with the full JID
            with_ = str(event.with_)
        else:
            with_ = event.with_.getStripped()

        stanza_id = event.stanza_id
        if event.self_message:
            # Self messages can only be deduped with origin-id
            if event.origin_id is None:
                self._log.warning('Self message without origin-id found')
                return
            stanza_id = event.origin_id

        if event.namespace == nbxmpp.NS_MAM_1:
            if app.logger.search_for_duplicate(
                    self._account, with_, event.timestamp, event.msgtxt):
                self._log.info('Found duplicate with fallback for mam:1')
                return

        app.logger.insert_into_logs(self._account,
                                    with_,
                                    event.timestamp,
                                    event.kind,
                                    unread=False,
                                    message=event.msgtxt,
                                    contact_name=event.nick,
                                    additional_data=event.additional_data,
                                    stanza_id=stanza_id,
                                    message_id=event.message_id)

        app.nec.push_incoming_event(
            MamDecryptedMessageReceived(None, **vars(event)))

    def _is_valid_request(self, properties):
        """Return whether the message answers a query we have running.

        A message is only accepted when a query id is registered for its
        archive and matches the message's query id. Without the explicit
        None check a result lacking a query id would be accepted whenever
        no query is registered (None == None).
        """
        valid_id = self._mam_query_ids.get(str(properties.mam.archive))
        if valid_id is None:
            return False
        return valid_id == properties.mam.query_id

    def _get_query_id(self, jid):
        """Create a new query id and register it for the archive jid."""
        query_id = self._con.connection.getAnID()
        self._mam_query_ids[jid] = query_id
        return query_id

    def _forget_query(self, jid, query_id=None):
        """Remove the query id registered for jid; never raises.

        When query_id is given, the entry is only removed if it still
        belongs to that query, so a failed old query cannot unregister a
        newer one running against the same archive.
        """
        if query_id is not None and self._mam_query_ids.get(jid) != query_id:
            return
        self._mam_query_ids.pop(jid, None)

    def _parse_iq(self, stanza):
        """Return the (fin, set) nodes of a MAM query result.

        Raises InvalidMamIQ if the stanza is not a result or if the
        'fin' node or its RSM 'set' child is missing.
        """
        if not nbxmpp.isResultNode(stanza):
            self._log.error('Error on MAM query: %s', stanza.getError())
            raise InvalidMamIQ

        fin = stanza.getTag('fin')
        if fin is None:
            self._log.error('Malformed MAM query result received: %s', stanza)
            raise InvalidMamIQ

        set_ = fin.getTag('set', namespace=nbxmpp.NS_RSM)
        if set_ is None:
            self._log.error(
                'Malformed MAM query result received (no "set" Node): %s',
                stanza)
            raise InvalidMamIQ
        return fin, set_

    def _get_from_jid(self, stanza):
        """Return the bare sender jid of stanza as a string."""
        jid = stanza.getFrom()
        if jid is None:
            # No from means, iq from our own archive
            return self._con.get_own_jid().getStripped()
        return jid.getStripped()

    def request_archive_count(self, start_date, end_date):
        """Ask our own archive how many messages lie in the interval.

        The query uses max_=0; the count is read from the reply in
        _received_count(). Returns the query id.
        """
        jid = self._con.get_own_jid().getStripped()
        self._log.info('Request archive count from: %s', jid)
        query_id = self._get_query_id(jid)
        query = self._get_archive_query(
            query_id, start=start_date, end=end_date, max_=0)
        self._con.connection.SendAndCallForResponse(
            query, self._received_count, {'query_id': query_id})
        return query_id

    def _received_count(self, _con, stanza, query_id):
        """Handle the reply to request_archive_count()."""
        jid = self._get_from_jid(stanza)
        try:
            _, set_ = self._parse_iq(stanza)
        except InvalidMamIQ:
            # Do not leave the failed query registered
            self._forget_query(jid, query_id)
            return

        self._forget_query(jid)

        count = set_.getTagData('count')
        self._log.info('Received archive count: %s', count)
        app.nec.push_incoming_event(ArchivingCountReceived(
            None, query_id=query_id, count=count))

    def request_archive_on_signin(self):
        """Catch up with our own archive.

        Continues after the last known mam id if there is one, otherwise
        requests the last seven days. Does nothing if a query for our
        own archive is already registered.
        """
        own_jid = self._con.get_own_jid().getStripped()

        if own_jid in self._mam_query_ids:
            self._log.warning('MAM request for %s already running', own_jid)
            return

        archive = app.logger.get_archive_infos(own_jid)

        # Migration of last_mam_id from config to DB
        if archive is not None:
            mam_id = archive.last_mam_id
        else:
            mam_id = app.config.get_per(
                'accounts', self._account, 'last_mam_id')
            if mam_id:
                app.config.del_per('accounts', self._account, 'last_mam_id')

        start_date = None
        query_id = self._get_query_id(own_jid)
        if mam_id:
            self._log.info('MAM query after: %s', mam_id)
            query = self._get_archive_query(query_id, after=mam_id)
        else:
            # First Start, we request the last week
            start_date = datetime.utcnow() - timedelta(days=7)
            self._log.info('First start: query archive start: %s', start_date)
            query = self._get_archive_query(query_id, start=start_date)

        if own_jid in self._catch_up_finished:
            self._catch_up_finished.remove(own_jid)
        self._send_archive_query(query, query_id, start_date)

    def request_archive_on_muc_join(self, jid):
        """Catch up with the archive of the groupchat jid.

        On the first join only the last day is requested. Later joins
        continue after the last known mam id, unless a sync threshold is
        set and more than that many days have passed since the last
        recorded timestamp; then only the threshold window is requested.
        """
        archive = app.logger.get_archive_infos(jid)
        threshold = get_sync_threshold(jid, archive)
        self._log.info('Threshold for %s: %s', jid, threshold)
        query_id = self._get_query_id(jid)
        start_date = None
        if archive is None or archive.last_mam_id is None:
            # First join, we only request the last day.
            # Depending on what a MUC saves, there could be thousands
            # of messages even in just one day.
            start_date = datetime.utcnow() - timedelta(days=1)
            self._log.info('First join: query archive %s from: %s',
                           jid, start_date)
            query = self._get_archive_query(
                query_id, jid=jid, start=start_date)

        elif threshold == SyncThreshold.NO_THRESHOLD:
            # Not our first join and no threshold set
            self._log.info('Request from archive: %s, after mam-id %s',
                           jid, archive.last_mam_id)
            query = self._get_archive_query(
                query_id, jid=jid, after=archive.last_mam_id)

        else:
            # Not our first join, check how much time elapsed since our
            # last join and check against threshold
            last_timestamp = archive.last_muc_timestamp
            if last_timestamp is None:
                self._log.info('No last muc timestamp found ( mam:1? )')
                last_timestamp = 0

            last = datetime.utcfromtimestamp(float(last_timestamp))
            if datetime.utcnow() - last > timedelta(days=threshold):
                # Too much time has elapsed since last join, apply threshold
                start_date = datetime.utcnow() - timedelta(days=threshold)
                self._log.info('Too much time elapsed since last join, '
                               'request from: %s, threshold: %s',
                               start_date, threshold)
                query = self._get_archive_query(
                    query_id, jid=jid, start=start_date)
            else:
                # Request from last mam-id
                self._log.info('Request from archive %s after %s:',
                               jid, archive.last_mam_id)
                query = self._get_archive_query(
                    query_id, jid=jid, after=archive.last_mam_id)

        if jid in self._catch_up_finished:
            self._catch_up_finished.remove(jid)
        self._send_archive_query(query, query_id, start_date, groupchat=True)

    def _send_archive_query(self, query, query_id, start_date=None,
                            groupchat=False):
        """Send a catch-up query; the reply goes to _result_finished()."""
        self._con.connection.SendAndCallForResponse(
            query, self._result_finished, {'query_id': query_id,
                                           'start_date': start_date,
                                           'groupchat': groupchat})

    def _result_finished(self, _con, stanza, query_id, start_date, groupchat):
        """Handle the reply that closes one page of a catch-up query.

        Requests the next page while the result is not complete;
        otherwise stores the archive state and marks the archive as
        caught up.
        """
        jid = self._get_from_jid(stanza)
        try:
            fin, set_ = self._parse_iq(stanza)
        except InvalidMamIQ:
            # A query id left behind would make request_archive_on_signin()
            # refuse every further attempt as 'already running'
            self._forget_query(jid, query_id)
            return

        last = set_.getTagData('last')
        if last is None:
            self._log.info('End of MAM query, no items retrieved')
            self._catch_up_finished.append(jid)
            self._forget_query(jid)
            return

        complete = fin.getAttr('complete')
        if complete != 'true':
            # More pages to fetch, continue after the last received id
            app.logger.set_archive_infos(jid, last_mam_id=last)
            self._forget_query(jid)
            query_id = self._get_query_id(jid)
            query = self._get_archive_query(query_id, jid=jid, after=last)
            self._send_archive_query(query, query_id, groupchat=groupchat)
        else:
            self._forget_query(jid)
            app.logger.set_archive_infos(
                jid, last_mam_id=last, last_muc_timestamp=time.time())
            if start_date is not None and not groupchat:
                # Record the earliest timestamp we request from
                # the account archive. For the account archive we only
                # set start_date at the very first request.
                app.logger.set_archive_infos(
                    jid, oldest_mam_timestamp=start_date.timestamp())

            self._catch_up_finished.append(jid)
            self._log.info('End of MAM query, last mam id: %s', last)

    def request_archive_interval(self, start_date, end_date, after=None,
                                 query_id=None):
        """Request one page (max 30 items) of our own archive.

        Called without query_id for the first page; _intervall_result()
        calls it again with the same query_id and the last received id
        in after until the result is complete. Returns the query id.
        """
        jid = self._con.get_own_jid().getStripped()
        if after is None:
            self._log.info('Request intervall from %s to %s from %s',
                           start_date, end_date, jid)
        else:
            self._log.info('Query page after %s from %s', after, jid)

        if query_id is None:
            # _get_query_id() registers the new id itself
            query_id = self._get_query_id(jid)
        else:
            # Follow-up page: register the id again, the previous
            # reply removed it
            self._mam_query_ids[jid] = query_id

        query = self._get_archive_query(query_id, start=start_date,
                                        end=end_date, after=after, max_=30)

        self._con.connection.SendAndCallForResponse(
            query, self._intervall_result, {'query_id': query_id,
                                            'start_date': start_date,
                                            'end_date': end_date})
        return query_id

    def _intervall_result(self, _con, stanza, query_id,
                          start_date, end_date):
        """Handle the reply to one page of request_archive_interval()."""
        jid = self._get_from_jid(stanza)
        try:
            fin, set_ = self._parse_iq(stanza)
        except InvalidMamIQ:
            # Do not leave the failed query registered
            self._forget_query(jid, query_id)
            return

        self._forget_query(jid)
        if start_date:
            timestamp = start_date.timestamp()
        else:
            timestamp = ArchiveState.ALL

        last = set_.getTagData('last')
        if last is None:
            app.nec.push_incoming_event(ArchivingIntervalFinished(
                None, query_id=query_id))
            app.logger.set_archive_infos(
                jid, oldest_mam_timestamp=timestamp)
            self._log.info('End of MAM request, no items retrieved')
            return

        complete = fin.getAttr('complete')
        if complete != 'true':
            self.request_archive_interval(start_date, end_date, last, query_id)
        else:
            self._log.info('Request finished')
            app.logger.set_archive_infos(
                jid, oldest_mam_timestamp=timestamp)
            app.nec.push_incoming_event(ArchivingIntervalFinished(
                None, query_id=query_id))

    def _get_archive_query(self, query_id, jid=None, start=None, end=None,
                           with_=None, after=None, max_=70):
        """Build the iq for an archive query.

        :param query_id: value of the 'queryid' attribute
        :param jid: archive to address; also used to look up the MAM
                    namespace of a MUC, falling back to our own one
        :param start: datetime for the 'start' form field (optional)
        :param end: datetime for the 'end' form field (optional)
        :param with_: value for the 'with' form field (optional)
        :param after: RSM 'after' id to continue from (optional)
        :param max_: RSM 'max' page size
        """
        # Muc archive query?
        namespace = muc_caps_cache.get_mam_namespace(jid)
        if namespace is None:
            # Query to our own archive
            namespace = self.archiving_namespace

        iq = nbxmpp.Iq('set', to=jid)
        query = iq.addChild('query', namespace=namespace)
        form = query.addChild(node=nbxmpp.DataForm(typ='submit'))
        form.addChild(node=nbxmpp.DataField(typ='hidden',
                                            name='FORM_TYPE',
                                            value=namespace))
        if start:
            form.addChild(node=nbxmpp.DataField(
                typ='text-single',
                name='start',
                value=start.strftime(self._DATE_FORMAT)))
        if end:
            form.addChild(node=nbxmpp.DataField(
                typ='text-single',
                name='end',
                value=end.strftime(self._DATE_FORMAT)))
        if with_:
            form.addChild(node=nbxmpp.DataField(typ='jid-single',
                                                name='with',
                                                value=with_))

        set_ = query.setTag('set', namespace=nbxmpp.NS_RSM)
        set_.setTagData('max', max_)
        if after:
            set_.setTagData('after', after)
        query.setAttr('queryid', query_id)
        return iq

    def save_archive_id(self, jid, stanza_id, timestamp):
        """Store the archive position of a message.

        jid None means our own archive. Nothing is stored for an archive
        that is not marked as caught up.
        """
        if jid is None:
            jid = self._con.get_own_jid().getStripped()
        if jid not in self._catch_up_finished:
            return
        self._log.info('Save: %s: %s, %s', jid, stanza_id, timestamp)
        if stanza_id is None:
            # mam:1
            app.logger.set_archive_infos(jid, last_muc_timestamp=timestamp)
        else:
            # mam:2
            app.logger.set_archive_infos(
                jid, last_mam_id=stanza_id, last_muc_timestamp=timestamp)

    def request_mam_preferences(self):
        """Request the archiving preferences from the server."""
        self._log.info('Request MAM preferences')
        iq = nbxmpp.Iq('get', self.archiving_namespace)
        iq.setQuery('prefs')
        self._con.connection.SendAndCallForResponse(
            iq, self._preferences_received)

    def _preferences_received(self, stanza):
        """Handle the reply to request_mam_preferences().

        Pushes MAMPreferenceError on an error reply, otherwise
        MAMPreferenceReceived with the default policy and a list of
        (jid, 'Always' | 'Never') rules.
        """
        if not nbxmpp.isResultNode(stanza):
            self._log.info('Error: %s', stanza.getError())
            app.nec.push_incoming_event(MAMPreferenceError(
                None, conn=self._con, error=stanza.getError()))
            return

        self._log.info('Received MAM preferences')
        prefs = stanza.getTag('prefs', namespace=self.archiving_namespace)
        if prefs is None:
            self._log.error('Malformed stanza (no prefs node): %s', stanza)
            return

        rules = []
        default = prefs.getAttr('default')
        for tag_name, label in (('always', 'Always'), ('never', 'Never')):
            container = prefs.getTag(tag_name)
            if container is None:
                # Tolerate a reply that leaves out an empty list
                continue
            for item in container.getTags('jid'):
                rules.append((item.getData(), label))

        app.nec.push_incoming_event(MAMPreferenceReceived(
            None, conn=self._con, rules=rules, default=default))

    def set_mam_preferences(self, rules, default):
        """Send new archiving preferences to the server.

        :param rules: iterable of (jid, archive) pairs; a true archive
                      value puts the jid into 'always', otherwise 'never'
        :param default: value of the 'default' attribute
        """
        iq = nbxmpp.Iq(typ='set')
        prefs = iq.addChild(name='prefs',
                            namespace=self.archiving_namespace,
                            attrs={'default': default})
        always = prefs.addChild(name='always')
        never = prefs.addChild(name='never')
        for jid, archive in rules:
            target = always if archive else never
            target.addChild(name='jid').setData(jid)

        self._con.connection.SendAndCallForResponse(
            iq, self._preferences_saved)

    def _preferences_saved(self, stanza):
        """Handle the reply to set_mam_preferences()."""
        if not nbxmpp.isResultNode(stanza):
            self._log.info('Error: %s', stanza.getError())
            app.nec.push_incoming_event(MAMPreferenceError(
                None, conn=self._con, error=stanza.getError()))
        else:
            self._log.info('Preferences saved')
            app.nec.push_incoming_event(
                MAMPreferenceSaved(None, conn=self._con))
|
|
|
|
|
|
|
|
|
|
|
|
class MamMessageReceivedEvent(NetworkIncomingEvent):
    """Event built by the MAM module for an archived non-groupchat message."""

    name = 'mam-message-received'
|
|
|
|
|
|
|
|
|
|
|
|
class MamGcMessageReceivedEvent(NetworkIncomingEvent):
    """Event built by the MAM module for an archived groupchat message."""

    name = 'mam-gc-message-received'
|
2018-07-09 00:21:24 +02:00
|
|
|
|
|
|
|
|
|
|
|
class MamDecryptedMessageReceived(NetworkIncomingEvent):
    """Event pushed after an archived message was written to the logs."""

    name = 'mam-decrypted-message-received'
|
|
|
|
|
|
|
|
|
|
|
|
class MAMPreferenceError(NetworkIncomingEvent):
    """Event pushed when reading or saving MAM preferences failed."""

    name = 'mam-prefs-error'
|
|
|
|
|
|
|
|
|
|
|
|
class MAMPreferenceReceived(NetworkIncomingEvent):
    """Event pushed with the rules and default of the MAM preferences."""

    name = 'mam-prefs-received'
|
|
|
|
|
|
|
|
|
|
|
|
class MAMPreferenceSaved(NetworkIncomingEvent):
    """Event pushed when the server accepted new MAM preferences."""

    name = 'mam-prefs-saved'
|
|
|
|
|
|
|
|
|
|
|
|
class ArchivingCountReceived(NetworkIncomingEvent):
    """Event pushed with the message count returned for a count query."""

    name = 'archiving-count-received'
|
|
|
|
|
|
|
|
|
|
|
|
class ArchivingIntervalFinished(NetworkIncomingEvent):
    """Event pushed when an interval request has no further pages."""

    name = 'archiving-interval-finished'
|
|
|
|
|
|
|
|
|
|
|
|
class ArchivingErrorReceived(NetworkIncomingEvent):
    """Archiving error event.

    NOTE(review): not pushed anywhere in this module; presumably kept for
    users elsewhere - confirm before removing.
    """

    name = 'archiving-error-received'
|
|
|
|
|
|
|
|
|
|
|
|
class InvalidMamIQ(Exception):
    """Raised when a MAM query reply is an error or is malformed."""
|
|
|
|
|
|
|
|
|
|
|
|
def get_instance(*args, **kwargs):
    """Create the MAM module and return it together with its name 'MAM'."""
    module = MAM(*args, **kwargs)
    return module, 'MAM'
|