997 lines
33 KiB
Python
997 lines
33 KiB
Python
# Copyright (C) 2003-2014 Yann Leboulanger <asterix AT lagaule.org>
|
||
# Copyright (C) 2004-2005 Vincent Hanquez <tab AT snarc.org>
|
||
# Copyright (C) 2005-2006 Nikos Kouremenos <kourem AT gmail.com>
|
||
# Copyright (C) 2006 Dimitur Kirov <dkirov AT gmail.com>
|
||
# Copyright (C) 2006-2008 Jean-Marie Traissard <jim AT lapin.org>
|
||
# Copyright (C) 2007 Tomasz Melcer <liori AT exroot.org>
|
||
# Julien Pivotto <roidelapluie AT gmail.com>
|
||
# Copyright (C) 2018 Philipp Hörist <philipp AT hoerist.com>
|
||
#
|
||
# This file is part of Gajim.
|
||
#
|
||
# Gajim is free software; you can redistribute it and/or modify
|
||
# it under the terms of the GNU General Public License as published
|
||
# by the Free Software Foundation; version 3 only.
|
||
#
|
||
# Gajim is distributed in the hope that it will be useful,
|
||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
# GNU General Public License for more details.
|
||
#
|
||
# You should have received a copy of the GNU General Public License
|
||
# along with Gajim. If not, see <http://www.gnu.org/licenses/>.
|
||
|
||
import time
|
||
import datetime
|
||
import calendar
|
||
import json
|
||
import logging
|
||
import sqlite3 as sqlite
|
||
from collections import namedtuple
|
||
|
||
from gajim.common import app
|
||
from gajim.common import configpaths
|
||
from gajim.common.helpers import AdditionalDataDict
|
||
from gajim.common.const import ShowConstant
|
||
from gajim.common.const import KindConstant
|
||
from gajim.common.const import JIDConstant
|
||
|
||
from gajim.common.storage.base import SqliteStorage
|
||
from gajim.common.storage.base import timeit
|
||
|
||
|
||
CURRENT_USER_VERSION = 6
|
||
|
||
ARCHIVE_SQL_STATEMENT = '''
|
||
CREATE TABLE jids(
|
||
jid_id INTEGER PRIMARY KEY AUTOINCREMENT UNIQUE,
|
||
jid TEXT UNIQUE,
|
||
type INTEGER
|
||
);
|
||
CREATE TABLE unread_messages(
|
||
message_id INTEGER PRIMARY KEY AUTOINCREMENT UNIQUE,
|
||
jid_id INTEGER,
|
||
shown BOOLEAN default 0
|
||
);
|
||
CREATE INDEX idx_unread_messages_jid_id ON unread_messages (jid_id);
|
||
CREATE TABLE logs(
|
||
log_line_id INTEGER PRIMARY KEY AUTOINCREMENT UNIQUE,
|
||
account_id INTEGER,
|
||
jid_id INTEGER,
|
||
contact_name TEXT,
|
||
time INTEGER,
|
||
kind INTEGER,
|
||
show INTEGER,
|
||
message TEXT,
|
||
error TEXT,
|
||
subject TEXT,
|
||
additional_data TEXT,
|
||
stanza_id TEXT,
|
||
message_id TEXT,
|
||
encryption TEXT,
|
||
encryption_state TEXT,
|
||
marker INTEGER
|
||
);
|
||
CREATE TABLE last_archive_message(
|
||
jid_id INTEGER PRIMARY KEY UNIQUE,
|
||
last_mam_id TEXT,
|
||
oldest_mam_timestamp TEXT,
|
||
last_muc_timestamp TEXT
|
||
);
|
||
CREATE INDEX idx_logs_jid_id_time ON logs (jid_id, time DESC);
|
||
CREATE INDEX idx_logs_stanza_id ON logs (stanza_id);
|
||
CREATE INDEX idx_logs_message_id ON logs (message_id);
|
||
PRAGMA user_version=%s;
|
||
''' % CURRENT_USER_VERSION
|
||
|
||
|
||
log = logging.getLogger('gajim.c.storage.archive')
|
||
|
||
|
||
class MessageArchiveStorage(SqliteStorage):
|
||
def __init__(self):
|
||
SqliteStorage.__init__(self,
|
||
log,
|
||
configpaths.get('LOG_DB'),
|
||
ARCHIVE_SQL_STATEMENT)
|
||
|
||
self._jid_ids = {}
|
||
self._jid_ids_reversed = {}
|
||
|
||
def init(self, **kwargs):
|
||
SqliteStorage.init(self,
|
||
detect_types=sqlite.PARSE_COLNAMES)
|
||
|
||
self._set_journal_mode('WAL')
|
||
self._enable_secure_delete()
|
||
|
||
self._con.row_factory = self._namedtuple_factory
|
||
|
||
self._con.create_function("like", 1, self._like)
|
||
self._con.create_function("get_timeout", 0, self._get_timeout)
|
||
|
||
self._get_jid_ids_from_db()
|
||
self._cleanup_chat_history()
|
||
|
||
def _namedtuple_factory(self, cursor, row):
|
||
fields = [col[0] for col in cursor.description]
|
||
Row = namedtuple("Row", fields)
|
||
named_row = Row(*row)
|
||
if 'additional_data' in fields:
|
||
_dict = json.loads(named_row.additional_data or '{}')
|
||
named_row = named_row._replace(
|
||
additional_data=AdditionalDataDict(_dict))
|
||
|
||
# if an alias `account` for the field `account_id` is used for the
|
||
# query, the account_id is converted to the account jid
|
||
if 'account' in fields:
|
||
if named_row.account:
|
||
jid = self._jid_ids_reversed[named_row.account].jid
|
||
named_row = named_row._replace(account=jid)
|
||
return named_row
|
||
|
||
def _migrate(self):
|
||
user_version = self.user_version
|
||
if user_version == 0:
|
||
# All migrations from 0.16.9 until 1.0.0
|
||
statements = [
|
||
'ALTER TABLE logs ADD COLUMN "account_id" INTEGER',
|
||
'ALTER TABLE logs ADD COLUMN "stanza_id" TEXT',
|
||
'ALTER TABLE logs ADD COLUMN "encryption" TEXT',
|
||
'ALTER TABLE logs ADD COLUMN "encryption_state" TEXT',
|
||
'ALTER TABLE logs ADD COLUMN "marker" INTEGER',
|
||
'ALTER TABLE logs ADD COLUMN "additional_data" TEXT',
|
||
'''CREATE TABLE IF NOT EXISTS last_archive_message(
|
||
jid_id INTEGER PRIMARY KEY UNIQUE,
|
||
last_mam_id TEXT,
|
||
oldest_mam_timestamp TEXT,
|
||
last_muc_timestamp TEXT
|
||
)''',
|
||
|
||
'''CREATE INDEX IF NOT EXISTS idx_logs_stanza_id
|
||
ON logs(stanza_id)''',
|
||
'PRAGMA user_version=1'
|
||
]
|
||
|
||
self._execute_multiple(statements)
|
||
|
||
if user_version < 2:
|
||
statements = [
|
||
'ALTER TABLE last_archive_message ADD COLUMN "sync_threshold" INTEGER',
|
||
'PRAGMA user_version=2'
|
||
]
|
||
self._execute_multiple(statements)
|
||
|
||
if user_version < 3:
|
||
statements = [
|
||
'ALTER TABLE logs ADD COLUMN "message_id" TEXT',
|
||
'PRAGMA user_version=3'
|
||
]
|
||
self._execute_multiple(statements)
|
||
|
||
if user_version < 4:
|
||
statements = [
|
||
'ALTER TABLE logs ADD COLUMN "error" TEXT',
|
||
'PRAGMA user_version=4'
|
||
]
|
||
self._execute_multiple(statements)
|
||
|
||
if user_version < 5:
|
||
statements = [
|
||
'CREATE INDEX idx_logs_message_id ON logs (message_id)',
|
||
'PRAGMA user_version=5'
|
||
]
|
||
self._execute_multiple(statements)
|
||
|
||
@staticmethod
|
||
def dispatch(event, error):
|
||
app.ged.raise_event(event, None, str(error))
|
||
|
||
@staticmethod
|
||
def _get_timeout():
|
||
"""
|
||
returns the timeout in epoch
|
||
"""
|
||
timeout = app.settings.get('restore_timeout')
|
||
|
||
now = int(time.time())
|
||
if timeout > 0:
|
||
timeout = now - (timeout * 60)
|
||
return timeout
|
||
|
||
@staticmethod
|
||
def _like(search_str):
|
||
return '%{}%'.format(search_str)
|
||
|
||
@timeit
|
||
def _get_jid_ids_from_db(self):
|
||
"""
|
||
Load all jid/jid_id tuples into a dict for faster access
|
||
"""
|
||
rows = self._con.execute(
|
||
'SELECT jid_id, jid, type FROM jids').fetchall()
|
||
for row in rows:
|
||
self._jid_ids[row.jid] = row
|
||
self._jid_ids_reversed[row.jid_id] = row
|
||
|
||
def get_jids_in_db(self):
|
||
return self._jid_ids.keys()
|
||
|
||
def jid_is_from_pm(self, jid):
|
||
"""
|
||
If jid is gajim@conf/nkour it's likely a pm one, how we know gajim@conf
|
||
is not a normal guy and nkour is not his resource? we ask if gajim@conf
|
||
is already in jids (with type room jid) this fails if user disables
|
||
logging for room and only enables for pm (so highly unlikely) and if we
|
||
fail we do not go chaos (user will see the first pm as if it was message
|
||
in room's public chat) and after that all okay
|
||
"""
|
||
if jid.find('/') > -1:
|
||
possible_room_jid = jid.split('/', 1)[0]
|
||
return self.jid_is_room_jid(possible_room_jid)
|
||
# it's not a full jid, so it's not a pm one
|
||
return False
|
||
|
||
def jid_is_room_jid(self, jid):
|
||
"""
|
||
Return True if it's a room jid, False if it's not, None if we don't know
|
||
"""
|
||
jid_ = self._jid_ids.get(jid)
|
||
if jid_ is None:
|
||
return None
|
||
return jid_.type == JIDConstant.ROOM_TYPE
|
||
|
||
@staticmethod
|
||
def _get_family_jids(account, jid):
|
||
"""
|
||
Get all jids of the metacontacts family
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The JID
|
||
|
||
returns a list of JIDs'
|
||
"""
|
||
family = app.contacts.get_metacontacts_family(account, jid)
|
||
if family:
|
||
return [user['jid'] for user in family]
|
||
return [jid]
|
||
|
||
def get_account_id(self, account, type_=JIDConstant.NORMAL_TYPE):
|
||
jid = app.get_jid_from_account(account)
|
||
return self.get_jid_id(jid, type_=type_)
|
||
|
||
@timeit
|
||
def get_jid_id(self, jid, kind=None, type_=None):
|
||
"""
|
||
Get the jid id from a jid.
|
||
In case the jid id is not found create a new one.
|
||
|
||
:param jid: The JID
|
||
|
||
:param kind: The KindConstant
|
||
|
||
:param type_: The JIDConstant
|
||
|
||
return the jid id
|
||
"""
|
||
|
||
if kind in (KindConstant.GC_MSG, KindConstant.GCSTATUS):
|
||
type_ = JIDConstant.ROOM_TYPE
|
||
elif kind is not None:
|
||
type_ = JIDConstant.NORMAL_TYPE
|
||
|
||
result = self._jid_ids.get(jid, None)
|
||
if result is not None:
|
||
return result.jid_id
|
||
|
||
sql = 'SELECT jid_id, jid, type FROM jids WHERE jid = ?'
|
||
row = self._con.execute(sql, [jid]).fetchone()
|
||
if row is not None:
|
||
self._jid_ids[jid] = row
|
||
return row.jid_id
|
||
|
||
if type_ is None:
|
||
raise ValueError(
|
||
'Unable to insert new JID because type is missing')
|
||
|
||
sql = 'INSERT INTO jids (jid, type) VALUES (?, ?)'
|
||
lastrowid = self._con.execute(sql, (jid, type_)).lastrowid
|
||
Row = namedtuple('Row', 'jid_id jid type')
|
||
self._jid_ids[jid] = Row(lastrowid, jid, type_)
|
||
self._delayed_commit()
|
||
return lastrowid
|
||
|
||
@staticmethod
|
||
def convert_show_values_to_db_api_values(show):
|
||
"""
|
||
Convert from string style to constant ints for db
|
||
"""
|
||
|
||
if show == 'online':
|
||
return ShowConstant.ONLINE
|
||
if show == 'chat':
|
||
return ShowConstant.CHAT
|
||
if show == 'away':
|
||
return ShowConstant.AWAY
|
||
if show == 'xa':
|
||
return ShowConstant.XA
|
||
if show == 'dnd':
|
||
return ShowConstant.DND
|
||
if show == 'offline':
|
||
return ShowConstant.OFFLINE
|
||
if show is None:
|
||
return ShowConstant.ONLINE
|
||
# invisible in GC when someone goes invisible
|
||
# it's a RFC violation .... but we should not crash
|
||
return None
|
||
|
||
@timeit
|
||
def insert_unread_events(self, message_id, jid_id):
|
||
"""
|
||
Add unread message with id: message_id
|
||
"""
|
||
sql = '''INSERT INTO unread_messages (message_id, jid_id, shown)
|
||
VALUES (?, ?, 0)'''
|
||
self._con.execute(sql, (message_id, jid_id))
|
||
self._delayed_commit()
|
||
|
||
@timeit
|
||
def set_read_messages(self, message_ids):
|
||
"""
|
||
Mark all messages with ids in message_ids as read
|
||
"""
|
||
ids = ','.join([str(i) for i in message_ids])
|
||
sql = 'DELETE FROM unread_messages WHERE message_id IN (%s)' % ids
|
||
self._con.execute(sql)
|
||
self._delayed_commit()
|
||
|
||
@timeit
|
||
def set_shown_unread_msgs(self, msg_log_id):
|
||
"""
|
||
Mark unread message as shown un GUI
|
||
"""
|
||
sql = 'UPDATE unread_messages SET shown = 1 where message_id = %s' % \
|
||
msg_log_id
|
||
self._con.execute(sql)
|
||
self._delayed_commit()
|
||
|
||
@timeit
|
||
def reset_shown_unread_messages(self):
|
||
"""
|
||
Set shown field to False in unread_messages table
|
||
"""
|
||
sql = 'UPDATE unread_messages SET shown = 0'
|
||
self._con.execute(sql)
|
||
self._delayed_commit()
|
||
|
||
@timeit
|
||
def get_unread_msgs(self):
|
||
"""
|
||
Get all unread messages
|
||
"""
|
||
all_messages = []
|
||
try:
|
||
unread_results = self._con.execute(
|
||
'SELECT message_id, shown from unread_messages').fetchall()
|
||
except Exception:
|
||
unread_results = []
|
||
for message in unread_results:
|
||
msg_log_id = message.message_id
|
||
shown = message.shown
|
||
# here we get infos for that message, and related jid from jids table
|
||
# do NOT change order of SELECTed things, unless you change function(s)
|
||
# that called this function
|
||
result = self._con.execute('''
|
||
SELECT logs.log_line_id, logs.message, logs.time, logs.subject,
|
||
jids.jid, logs.additional_data
|
||
FROM logs, jids
|
||
WHERE logs.log_line_id = %d AND logs.jid_id = jids.jid_id
|
||
''' % msg_log_id
|
||
).fetchone()
|
||
if result is None:
|
||
# Log line is no more in logs table.
|
||
# remove it from unread_messages
|
||
self.set_read_messages([msg_log_id])
|
||
continue
|
||
|
||
all_messages.append((result, shown))
|
||
return all_messages
|
||
|
||
@timeit
|
||
def load_groupchat_messages(self, account, jid):
|
||
account_id = self.get_account_id(account, type_=JIDConstant.ROOM_TYPE)
|
||
|
||
sql = '''
|
||
SELECT time, contact_name, message, additional_data, message_id
|
||
FROM logs NATURAL JOIN jids WHERE jid = ?
|
||
AND account_id = ? AND kind = ?
|
||
ORDER BY time DESC, log_line_id DESC LIMIT ?'''
|
||
|
||
messages = self._con.execute(
|
||
sql, (jid, account_id, KindConstant.GC_MSG, 50)).fetchall()
|
||
|
||
messages.reverse()
|
||
return messages
|
||
|
||
@timeit
|
||
def get_last_conversation_lines(self, account, jid, pending):
|
||
"""
|
||
Get recent messages
|
||
|
||
Pending messages are already in queue to be printed when the
|
||
ChatControl is opened, so we don’t want to request those messages.
|
||
How many messages are requested depends on the 'restore_lines'
|
||
config value. How far back in time messages are requested depends on
|
||
_get_timeout().
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The jid from which we request the conversation lines
|
||
|
||
:param pending: How many messages are currently pending so we don’t
|
||
request those messages
|
||
|
||
returns a list of namedtuples
|
||
"""
|
||
|
||
restore = app.settings.get('restore_lines')
|
||
if restore <= 0:
|
||
return []
|
||
|
||
kinds = map(str, [KindConstant.SINGLE_MSG_RECV,
|
||
KindConstant.SINGLE_MSG_SENT,
|
||
KindConstant.CHAT_MSG_RECV,
|
||
KindConstant.CHAT_MSG_SENT,
|
||
KindConstant.ERROR])
|
||
|
||
jids = self._get_family_jids(account, jid)
|
||
account_id = self.get_account_id(account)
|
||
|
||
sql = '''
|
||
SELECT time, kind, message, error as "error [common_error]",
|
||
subject, additional_data, marker as "marker [marker]",
|
||
message_id
|
||
FROM logs NATURAL JOIN jids WHERE jid IN ({jids})
|
||
AND account_id = {account_id} AND kind IN ({kinds})
|
||
AND time > get_timeout()
|
||
ORDER BY time DESC, log_line_id DESC LIMIT ? OFFSET ?
|
||
'''.format(jids=', '.join('?' * len(jids)),
|
||
account_id=account_id,
|
||
kinds=', '.join(kinds))
|
||
|
||
messages = self._con.execute(
|
||
sql, tuple(jids) + (restore, pending)).fetchall()
|
||
|
||
messages.reverse()
|
||
return messages
|
||
|
||
@timeit
|
||
def get_conversation_for_date(self, account, jid, date):
|
||
"""
|
||
Load the complete conversation with a given jid on a specific date
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The jid for which we request the conversation
|
||
|
||
:param date: datetime.datetime instance
|
||
example: datetime.datetime(year, month, day)
|
||
|
||
returns a list of namedtuples
|
||
"""
|
||
|
||
jids = self._get_family_jids(account, jid)
|
||
|
||
delta = datetime.timedelta(
|
||
hours=23, minutes=59, seconds=59, microseconds=999999)
|
||
|
||
sql = '''
|
||
SELECT contact_name, time, kind, show, message, subject,
|
||
additional_data, log_line_id
|
||
FROM logs NATURAL JOIN jids WHERE jid IN ({jids})
|
||
AND time BETWEEN ? AND ?
|
||
ORDER BY time, log_line_id
|
||
'''.format(jids=', '.join('?' * len(jids)))
|
||
|
||
return self._con.execute(sql, tuple(jids) +
|
||
(date.timestamp(),
|
||
(date + delta).timestamp())).fetchall()
|
||
|
||
@timeit
|
||
def search_log(self, account, jid, query, date=None):
|
||
"""
|
||
Search the conversation log for messages containing the `query` string.
|
||
|
||
The search can either span the complete log for the given
|
||
`account` and `jid` or be restricted to a single day by
|
||
specifying `date`.
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The jid for which we request the conversation
|
||
|
||
:param query: A search string
|
||
|
||
:param date: datetime.datetime instance
|
||
example: datetime.datetime(year, month, day)
|
||
|
||
returns a list of namedtuples
|
||
"""
|
||
jids = self._get_family_jids(account, jid)
|
||
|
||
if date:
|
||
delta = datetime.timedelta(
|
||
hours=23, minutes=59, seconds=59, microseconds=999999)
|
||
|
||
between = '''
|
||
AND time BETWEEN {start} AND {end}
|
||
'''.format(start=date.timestamp(),
|
||
end=(date + delta).timestamp())
|
||
|
||
sql = '''
|
||
SELECT contact_name, time, kind, show, message, subject,
|
||
additional_data, log_line_id
|
||
FROM logs NATURAL JOIN jids WHERE jid IN ({jids})
|
||
AND message LIKE like(?) {date_search}
|
||
ORDER BY time DESC, log_line_id
|
||
'''.format(jids=', '.join('?' * len(jids)),
|
||
date_search=between if date else '')
|
||
|
||
return self._con.execute(sql, tuple(jids) + (query,)).fetchall()
|
||
|
||
@timeit
|
||
def get_days_with_logs(self, account, jid, year, month):
|
||
"""
|
||
Request the days in a month where we received messages
|
||
for a given `jid`.
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The jid for which we request the days
|
||
|
||
:param year: The year
|
||
|
||
:param month: The month
|
||
|
||
returns a list of namedtuples
|
||
"""
|
||
jids = self._get_family_jids(account, jid)
|
||
|
||
kinds = map(str, [KindConstant.STATUS,
|
||
KindConstant.GCSTATUS])
|
||
|
||
# Calculate the start and end datetime of the month
|
||
date = datetime.datetime(year, month, 1)
|
||
days = calendar.monthrange(year, month)[1] - 1
|
||
delta = datetime.timedelta(
|
||
days=days, hours=23, minutes=59, seconds=59, microseconds=999999)
|
||
|
||
sql = """
|
||
SELECT DISTINCT
|
||
CAST(strftime('%d', time, 'unixepoch', 'localtime') AS INTEGER)
|
||
AS day FROM logs NATURAL JOIN jids WHERE jid IN ({jids})
|
||
AND time BETWEEN ? AND ?
|
||
AND kind NOT IN ({kinds})
|
||
ORDER BY time
|
||
""".format(jids=', '.join('?' * len(jids)),
|
||
kinds=', '.join(kinds))
|
||
|
||
return self._con.execute(sql, tuple(jids) +
|
||
(date.timestamp(),
|
||
(date + delta).timestamp())).fetchall()
|
||
|
||
@timeit
|
||
def get_last_date_that_has_logs(self, account, jid):
|
||
"""
|
||
Get the timestamp of the last message we received for the jid.
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The jid for which we request the last timestamp
|
||
|
||
returns a timestamp or None
|
||
"""
|
||
jids = self._get_family_jids(account, jid)
|
||
|
||
kinds = map(str, [KindConstant.STATUS,
|
||
KindConstant.GCSTATUS])
|
||
|
||
sql = '''
|
||
SELECT MAX(time) as time FROM logs
|
||
NATURAL JOIN jids WHERE jid IN ({jids})
|
||
AND kind NOT IN ({kinds})
|
||
'''.format(jids=', '.join('?' * len(jids)),
|
||
kinds=', '.join(kinds))
|
||
|
||
# fetchone() returns always at least one Row with all
|
||
# attributes set to None because of the MAX() function
|
||
return self._con.execute(sql, tuple(jids)).fetchone().time
|
||
|
||
@timeit
|
||
def get_first_date_that_has_logs(self, account, jid):
|
||
"""
|
||
Get the timestamp of the first message we received for the jid.
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The jid for which we request the first timestamp
|
||
|
||
returns a timestamp or None
|
||
"""
|
||
jids = self._get_family_jids(account, jid)
|
||
|
||
kinds = map(str, [KindConstant.STATUS,
|
||
KindConstant.GCSTATUS])
|
||
|
||
sql = '''
|
||
SELECT MIN(time) as time FROM logs
|
||
NATURAL JOIN jids WHERE jid IN ({jids})
|
||
AND kind NOT IN ({kinds})
|
||
'''.format(jids=', '.join('?' * len(jids)),
|
||
kinds=', '.join(kinds))
|
||
|
||
# fetchone() returns always at least one Row with all
|
||
# attributes set to None because of the MIN() function
|
||
return self._con.execute(sql, tuple(jids)).fetchone().time
|
||
|
||
@timeit
|
||
def get_date_has_logs(self, account, jid, date):
|
||
"""
|
||
Get single timestamp of a message we received for the jid
|
||
in the time range of one day.
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The jid for which we request the first timestamp
|
||
|
||
:param date: datetime.datetime instance
|
||
example: datetime.datetime(year, month, day)
|
||
|
||
returns a timestamp or None
|
||
"""
|
||
jids = self._get_family_jids(account, jid)
|
||
|
||
delta = datetime.timedelta(
|
||
hours=23, minutes=59, seconds=59, microseconds=999999)
|
||
|
||
start = date.timestamp()
|
||
end = (date + delta).timestamp()
|
||
|
||
sql = '''
|
||
SELECT time
|
||
FROM logs NATURAL JOIN jids WHERE jid IN ({jids})
|
||
AND time BETWEEN ? AND ?
|
||
'''.format(jids=', '.join('?' * len(jids)))
|
||
|
||
return self._con.execute(
|
||
sql, tuple(jids) + (start, end)).fetchone()
|
||
|
||
@timeit
|
||
def deduplicate_muc_message(self, account, jid, resource,
|
||
timestamp, message_id):
|
||
"""
|
||
Check if a message is already in the `logs` table
|
||
|
||
:param account: The account
|
||
|
||
:param jid: The muc jid as string
|
||
|
||
:param resource: The resource
|
||
|
||
:param timestamp: The timestamp in UTC epoch
|
||
|
||
:param message_id: The message-id
|
||
"""
|
||
|
||
# Add 60 seconds around the timestamp
|
||
start_time = timestamp - 60
|
||
end_time = timestamp + 60
|
||
|
||
account_id = self.get_account_id(account)
|
||
log.debug('Search for MUC duplicate')
|
||
log.debug('start: %s, end: %s, jid: %s, resource: %s, message-id: %s',
|
||
start_time, end_time, jid, resource, message_id)
|
||
|
||
sql = '''
|
||
SELECT * FROM logs
|
||
NATURAL JOIN jids WHERE
|
||
jid = ? AND
|
||
contact_name = ? AND
|
||
message_id = ? AND
|
||
account_id = ? AND
|
||
time BETWEEN ? AND ?
|
||
'''
|
||
|
||
result = self._con.execute(sql, (jid,
|
||
resource,
|
||
message_id,
|
||
account_id,
|
||
start_time,
|
||
end_time)).fetchone()
|
||
|
||
if result is not None:
|
||
log.debug('Found duplicate')
|
||
return True
|
||
return False
|
||
|
||
@timeit
|
||
def find_stanza_id(self, account, archive_jid, stanza_id, origin_id=None,
|
||
groupchat=False):
|
||
"""
|
||
Checks if a stanza-id is already in the `logs` table
|
||
|
||
:param account: The account
|
||
|
||
:param archive_jid: The jid of the archive the stanza-id belongs to
|
||
only used if groupchat=True
|
||
|
||
:param stanza_id: The stanza-id
|
||
|
||
:param origin_id: The origin-id
|
||
|
||
:param groupchat: stanza-id is from a groupchat
|
||
|
||
return True if the stanza-id was found
|
||
"""
|
||
ids = []
|
||
if stanza_id is not None:
|
||
ids.append(stanza_id)
|
||
if origin_id is not None:
|
||
ids.append(origin_id)
|
||
|
||
if not ids:
|
||
return False
|
||
|
||
type_ = JIDConstant.NORMAL_TYPE
|
||
if groupchat:
|
||
type_ = JIDConstant.ROOM_TYPE
|
||
|
||
archive_id = self.get_jid_id(archive_jid, type_=type_)
|
||
account_id = self.get_account_id(account)
|
||
|
||
if groupchat:
|
||
# Stanza ID is only unique within a specific archive.
|
||
# So a Stanza ID could be repeated in different MUCs, so we
|
||
# filter also for the archive JID which is the bare MUC jid.
|
||
|
||
# Use Unary-"+" operator for "jid_id", otherwise the
|
||
# idx_logs_jid_id_time index is used instead of the much better
|
||
# idx_logs_stanza_id index
|
||
sql = '''
|
||
SELECT stanza_id FROM logs
|
||
WHERE stanza_id IN ({values})
|
||
AND +jid_id = ? AND account_id = ? LIMIT 1
|
||
'''.format(values=', '.join('?' * len(ids)))
|
||
result = self._con.execute(
|
||
sql, tuple(ids) + (archive_id, account_id)).fetchone()
|
||
else:
|
||
sql = '''
|
||
SELECT stanza_id FROM logs
|
||
WHERE stanza_id IN ({values}) AND account_id = ? AND kind != ? LIMIT 1
|
||
'''.format(values=', '.join('?' * len(ids)))
|
||
result = self._con.execute(
|
||
sql, tuple(ids) + (account_id, KindConstant.GC_MSG)).fetchone()
|
||
|
||
if result is not None:
|
||
log.info('Found duplicated message, stanza-id: %s, origin-id: %s, '
|
||
'archive-jid: %s, account: %s', stanza_id, origin_id, archive_jid, account_id)
|
||
return True
|
||
return False
|
||
|
||
def insert_jid(self, jid, kind=None, type_=JIDConstant.NORMAL_TYPE):
|
||
"""
|
||
Insert a new jid into the `jids` table.
|
||
This is an alias of get_jid_id() for better readablility.
|
||
|
||
:param jid: The jid as string
|
||
|
||
:param kind: A KindConstant
|
||
|
||
:param type_: A JIDConstant
|
||
"""
|
||
return self.get_jid_id(jid, kind, type_)
|
||
|
||
@timeit
|
||
def insert_into_logs(self, account, jid, time_, kind,
|
||
unread=True, **kwargs):
|
||
"""
|
||
Insert a new message into the `logs` table
|
||
|
||
:param jid: The jid as string
|
||
|
||
:param time_: The timestamp in UTC epoch
|
||
|
||
:param kind: A KindConstant
|
||
|
||
:param unread: If True the message is added to the`unread_messages`
|
||
table. Only if kind == CHAT_MSG_RECV
|
||
|
||
:param kwargs: Every additional named argument must correspond to
|
||
a field in the `logs` table
|
||
"""
|
||
jid_id = self.get_jid_id(jid, kind=kind)
|
||
account_id = self.get_account_id(account)
|
||
|
||
if 'additional_data' in kwargs:
|
||
if not kwargs['additional_data']:
|
||
del kwargs['additional_data']
|
||
else:
|
||
serialized_dict = json.dumps(kwargs["additional_data"].data)
|
||
kwargs['additional_data'] = serialized_dict
|
||
|
||
sql = '''
|
||
INSERT INTO logs (account_id, jid_id, time, kind, {columns})
|
||
VALUES (?, ?, ?, ?, {values})
|
||
'''.format(columns=', '.join(kwargs.keys()),
|
||
values=', '.join('?' * len(kwargs)))
|
||
|
||
lastrowid = self._con.execute(
|
||
sql, (account_id, jid_id, time_, kind) + tuple(kwargs.values())).lastrowid
|
||
|
||
log.info('Insert into DB: jid: %s, time: %s, kind: %s, stanza_id: %s',
|
||
jid, time_, kind, kwargs.get('stanza_id', None))
|
||
|
||
if unread and kind == KindConstant.CHAT_MSG_RECV:
|
||
sql = '''INSERT INTO unread_messages (message_id, jid_id)
|
||
VALUES (?, (SELECT jid_id FROM jids WHERE jid = ?))'''
|
||
self._con.execute(sql, (lastrowid, jid))
|
||
|
||
self._delayed_commit()
|
||
|
||
return lastrowid
|
||
|
||
@timeit
|
||
def set_message_error(self, account_jid, jid, message_id, error):
|
||
"""
|
||
Update the corresponding message with the error
|
||
|
||
:param account_jid: The jid of the account
|
||
|
||
:param jid: The jid that belongs to the avatar
|
||
|
||
:param message_id: The id of the message
|
||
|
||
:param error: The error stanza as string
|
||
|
||
"""
|
||
|
||
account_id = self.get_jid_id(account_jid)
|
||
try:
|
||
jid_id = self.get_jid_id(str(jid))
|
||
except ValueError:
|
||
# Unknown JID
|
||
return
|
||
|
||
sql = '''
|
||
UPDATE logs SET error = ?
|
||
WHERE account_id = ? AND jid_id = ? AND message_id = ?
|
||
'''
|
||
self._con.execute(sql, (error, account_id, jid_id, message_id))
|
||
self._delayed_commit()
|
||
|
||
@timeit
|
||
def set_marker(self, account_jid, jid, message_id, state):
|
||
"""
|
||
Update the marker state of the corresponding message
|
||
|
||
:param account_jid: The jid of the account
|
||
|
||
:param jid: The jid that belongs to the avatar
|
||
|
||
:param message_id: The id of the message
|
||
|
||
:param state: The state, 'received' or 'displayed'
|
||
|
||
"""
|
||
if state not in ('received', 'displayed'):
|
||
raise ValueError('Invalid marker state')
|
||
|
||
account_id = self.get_jid_id(account_jid)
|
||
try:
|
||
jid_id = self.get_jid_id(str(jid))
|
||
except ValueError:
|
||
# Unknown JID
|
||
return
|
||
|
||
state = 0 if state == 'received' else 1
|
||
|
||
sql = '''
|
||
UPDATE logs SET marker = ?
|
||
WHERE account_id = ? AND jid_id = ? AND message_id = ?
|
||
'''
|
||
self._con.execute(sql, (state, account_id, jid_id, message_id))
|
||
self._delayed_commit()
|
||
|
||
@timeit
|
||
def get_archive_infos(self, jid):
|
||
"""
|
||
Get the archive infos
|
||
|
||
:param jid: The jid that belongs to the avatar
|
||
|
||
"""
|
||
jid_id = self.get_jid_id(jid, type_=JIDConstant.ROOM_TYPE)
|
||
sql = '''SELECT * FROM last_archive_message WHERE jid_id = ?'''
|
||
return self._con.execute(sql, (jid_id,)).fetchone()
|
||
|
||
@timeit
|
||
def set_archive_infos(self, jid, **kwargs):
|
||
"""
|
||
Set archive infos
|
||
|
||
:param jid: The jid that belongs to the avatar
|
||
|
||
:param last_mam_id: The last MAM result id
|
||
|
||
:param oldest_mam_timestamp: The oldest date we requested MAM
|
||
history for
|
||
|
||
:param last_muc_timestamp: The timestamp of the last message we
|
||
received in a MUC
|
||
|
||
:param sync_threshold: The max days that we request from a
|
||
MUC archive
|
||
|
||
"""
|
||
jid_id = self.get_jid_id(jid)
|
||
exists = self.get_archive_infos(jid)
|
||
if not exists:
|
||
sql = '''INSERT INTO last_archive_message
|
||
(jid_id, last_mam_id, oldest_mam_timestamp,
|
||
last_muc_timestamp)
|
||
VALUES (?, ?, ?, ?)'''
|
||
self._con.execute(sql, (
|
||
jid_id,
|
||
kwargs.get('last_mam_id', None),
|
||
kwargs.get('oldest_mam_timestamp', None),
|
||
kwargs.get('last_muc_timestamp', None),
|
||
))
|
||
else:
|
||
for key, value in list(kwargs.items()):
|
||
if value is None:
|
||
del kwargs[key]
|
||
|
||
args = ' = ?, '.join(kwargs.keys()) + ' = ?'
|
||
sql = '''UPDATE last_archive_message SET {}
|
||
WHERE jid_id = ?'''.format(args)
|
||
self._con.execute(sql, tuple(kwargs.values()) + (jid_id,))
|
||
log.info('Set message archive info: %s %s', jid, kwargs)
|
||
self._delayed_commit()
|
||
|
||
@timeit
|
||
def reset_archive_infos(self, jid):
|
||
"""
|
||
Set archive infos
|
||
|
||
:param jid: The jid of the archive
|
||
|
||
"""
|
||
jid_id = self.get_jid_id(jid)
|
||
sql = '''UPDATE last_archive_message
|
||
SET last_mam_id = NULL, oldest_mam_timestamp = NULL,
|
||
last_muc_timestamp = NULL
|
||
WHERE jid_id = ?'''
|
||
self._con.execute(sql, (jid_id,))
|
||
log.info('Reset message archive info: %s', jid)
|
||
self._delayed_commit()
|
||
|
||
def _cleanup_chat_history(self):
|
||
"""
|
||
Remove messages from account where messages are older than max_age
|
||
"""
|
||
for account in app.settings.get_accounts():
|
||
max_age = app.settings.get_account_setting(
|
||
account, 'chat_history_max_age')
|
||
if max_age == -1:
|
||
continue
|
||
account_id = self.get_account_id(account)
|
||
now = time.time()
|
||
point_in_time = now - int(max_age)
|
||
|
||
sql = 'DELETE FROM logs WHERE account_id = ? AND time < ?'
|
||
|
||
cursor = self._con.execute(sql, (account_id, point_in_time))
|
||
self._delayed_commit()
|
||
log.info('Removed %s old messages for %s', cursor.rowcount, account)
|