libervia-backend: comparison of sat/memory/sqlite.py @ 2699:310e41bd6666
core (memory/sqlite): added stanza_id:
/!\ database schema change /!\
stanza_id is a new field in the history table, added to prepare the implementation of MAM for messages.
A new "last_stanza_id" filter can be used to retrieve the last message with a known stanza id (useful for history synchronisation).
author | Goffi <goffi@goffi.org>
date | Sat, 01 Dec 2018 10:08:17 +0100
parents | 26edcf3a30eb
children | 9adf44996e58
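The "last_stanza_id" filter described above is consumed by the history-retrieval method shown further down; its def line is outside the hunks of this comparison, so the method name in this caller-side sketch is a guess, but the argument constraints (no from/to JID, limit of 1, filter value literally True) come straight from the added checks:

# Hypothetical caller-side sketch: fetch the last message for which a
# stanza_id is known, e.g. to build a MAM (XEP-0313) catch-up request.
# getHistory is assumed to be the method carrying the docstring below.
d = storage.getHistory(
    from_jid=None,
    to_jid=None,
    limit=1,                              # the added check requires exactly 1
    filters={u'last_stanza_id': True},    # must be literally True
    profile=u'some_profile',              # hypothetical profile name
)
d.addCallback(lambda messages: messages[0] if messages else None)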
2698:5060cbeec01e | 2699:310e41bd6666 |
---|---|
34 import cPickle as pickle | 34 import cPickle as pickle |
35 import hashlib | 35 import hashlib |
36 import sqlite3 | 36 import sqlite3 |
37 import json | 37 import json |
38 | 38 |
39 CURRENT_DB_VERSION = 5 | 39 CURRENT_DB_VERSION = 6 |
40 | 40 |
41 # XXX: DATABASE schemas are used in the following way: | 41 # XXX: DATABASE schemas are used in the following way: |
42 # - 'current' key is for the actual database schema, for a new base | 42 # - 'current' key is for the actual database schema, for a new base |
43 # - x(int) is for update needed between x-1 and x. All number are needed between y and z to do an update | 43 # - x(int) is for update needed between x-1 and x. All number are needed between y and z to do an update |
44 # e.g.: if CURRENT_DB_VERSION is 6, 'current' is the actuel DB, and to update from version 3, numbers 4, 5 and 6 are needed | 44 # e.g.: if CURRENT_DB_VERSION is 6, 'current' is the actuel DB, and to update from version 3, numbers 4, 5 and 6 are needed |
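As the comment above explains, 'current' describes the full schema for a new database while each integer key holds the migration from the previous version; a minimal sketch of how the needed steps can be picked (the real updater code is outside these hunks, so the helper below is illustrative only):

CURRENT_DB_VERSION = 6

def updates_needed(found_version):
    """Return the update entries to apply, in order (illustrative helper)."""
    # e.g. a database found at version 3 needs entries 4, 5 and 6
    return range(found_version + 1, CURRENT_DB_VERSION + 1)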
54 ("UNIQUE (name)",))), | 54 ("UNIQUE (name)",))), |
55 ('components', (("profile_id INTEGER PRIMARY KEY", "entry_point TEXT NOT NULL"), | 55 ('components', (("profile_id INTEGER PRIMARY KEY", "entry_point TEXT NOT NULL"), |
56 ("FOREIGN KEY(profile_id) REFERENCES profiles(id) ON DELETE CASCADE",))), | 56 ("FOREIGN KEY(profile_id) REFERENCES profiles(id) ON DELETE CASCADE",))), |
57 ('message_types', (("type TEXT PRIMARY KEY",), | 57 ('message_types', (("type TEXT PRIMARY KEY",), |
58 ())), | 58 ())), |
59 ('history', (("uid TEXT PRIMARY KEY", "update_uid TEXT", "profile_id INTEGER", "source TEXT", "dest TEXT", "source_res TEXT", "dest_res TEXT", | 59 ('history', (("uid TEXT PRIMARY KEY", "stanza_id TEXT", "update_uid TEXT", "profile_id INTEGER", "source TEXT", "dest TEXT", "source_res TEXT", "dest_res TEXT", |
60 "timestamp DATETIME NOT NULL", "received_timestamp DATETIME", # XXX: timestamp is the time when the message was emitted. If received time stamp is not NULL, the message was delayed and timestamp is the declared value (and received_timestamp the time of reception) | 60 "timestamp DATETIME NOT NULL", "received_timestamp DATETIME", # XXX: timestamp is the time when the message was emitted. If received time stamp is not NULL, the message was delayed and timestamp is the declared value (and received_timestamp the time of reception) |
61 "type TEXT", "extra BLOB"), | 61 "type TEXT", "extra BLOB"), |
62 ("FOREIGN KEY(profile_id) REFERENCES profiles(id) ON DELETE CASCADE", "FOREIGN KEY(type) REFERENCES message_types(type)", | 62 ("FOREIGN KEY(profile_id) REFERENCES profiles(id) ON DELETE CASCADE", "FOREIGN KEY(type) REFERENCES message_types(type)", |
63 "UNIQUE (profile_id, timestamp, source, dest, source_res, dest_res)" # avoid storing 2 time the same message (specially for delayed ones) | 63 "UNIQUE (profile_id, timestamp, source, dest, source_res, dest_res)" # avoid storing 2 time the same message (specially for delayed ones) |
64 ))), | 64 ))), |
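Assembled by hand from the column and constraint tuples above, the 'history' table of a fresh version-6 database should look roughly like this (a sketch; the real schema builder may format the statement differently):

# Approximate DDL produced from the 'history' entry above (hand-assembled).
HISTORY_TABLE_SQL = u"""
CREATE TABLE history (
    uid TEXT PRIMARY KEY,
    stanza_id TEXT,
    update_uid TEXT,
    profile_id INTEGER,
    source TEXT,
    dest TEXT,
    source_res TEXT,
    dest_res TEXT,
    timestamp DATETIME NOT NULL,
    received_timestamp DATETIME,
    type TEXT,
    extra BLOB,
    FOREIGN KEY(profile_id) REFERENCES profiles(id) ON DELETE CASCADE,
    FOREIGN KEY(type) REFERENCES message_types(type),
    UNIQUE (profile_id, timestamp, source, dest, source_res, dest_res)
)"""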
96 ("'normal'",), | 96 ("'normal'",), |
97 ("'info'",) # info is not standard, but used to keep track of info like join/leave in a MUC | 97 ("'info'",) # info is not standard, but used to keep track of info like join/leave in a MUC |
98 )), | 98 )), |
99 )), | 99 )), |
100 }, | 100 }, |
101 6: {'cols create': {'history': ('stanza_id TEXT',)}, | |
102 }, | |
101 5: {'create': {'files': (("id TEXT NOT NULL", "version TEXT NOT NULL", "parent TEXT NOT NULL", | 103 5: {'create': {'files': (("id TEXT NOT NULL", "version TEXT NOT NULL", "parent TEXT NOT NULL", |
102 "type TEXT CHECK(type in ('{file}', '{directory}')) NOT NULL DEFAULT '{file}'".format( | 104 "type TEXT CHECK(type in ('{file}', '{directory}')) NOT NULL DEFAULT '{file}'".format( |
103 file=C.FILE_TYPE_FILE, directory=C.FILE_TYPE_DIRECTORY), | 105 file=C.FILE_TYPE_FILE, directory=C.FILE_TYPE_DIRECTORY), |
104 "file_hash TEXT", "hash_algo TEXT", "name TEXT NOT NULL", "size INTEGER", | 106 "file_hash TEXT", "hash_algo TEXT", "name TEXT NOT NULL", "size INTEGER", |
105 "namespace TEXT", "mime_type TEXT", | 107 "namespace TEXT", "mime_type TEXT", |
115 }, | 117 }, |
116 1: {'cols create': {'history': ('extra BLOB',)}, | 118 1: {'cols create': {'history': ('extra BLOB',)}, |
117 }, | 119 }, |
118 } | 120 } |
119 | 121 |
120 NOT_IN_EXTRA = ('received_timestamp', 'update_uid') # keys which are in message data extra but not stored in sqlite's extra field | 122 NOT_IN_EXTRA = ('stanza_id', 'received_timestamp', 'update_uid') # keys which are in message data extra but not stored in sqlite's extra field |
121 # this is specific to this sqlite storage and for now only used for received_timestamp | 123 # this is specific to this sqlite storage and for now only used for received_timestamp |
122 # because this value is stored in a separate field | 124 # because this value is stored in a separate field |
123 | 125 |
124 | 126 |
125 class ConnectionPool(adbapi.ConnectionPool): | 127 class ConnectionPool(adbapi.ConnectionPool): |
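For databases already at version 5, the new 6: {'cols create': {'history': ('stanza_id TEXT',)}} entry presumably reduces to a single column addition; a sketch of the equivalent statement (the code that interprets 'cols create' lives elsewhere in this file and is not shown in this comparison):

import sqlite3

# Assumed equivalent of the version-6 'cols create' update for an existing
# database; SQLite adds one column per ALTER TABLE statement.
con = sqlite3.connect("sat.db")   # hypothetical database path
con.execute("ALTER TABLE history ADD COLUMN stanza_id TEXT")
con.commit()
con.close()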
421 @param data(dict): message data as build by SatMessageProtocol.onMessage | 423 @param data(dict): message data as build by SatMessageProtocol.onMessage |
422 """ | 424 """ |
423 extra = pickle.dumps({k: v for k, v in data['extra'].iteritems() if k not in NOT_IN_EXTRA}, 0) | 425 extra = pickle.dumps({k: v for k, v in data['extra'].iteritems() if k not in NOT_IN_EXTRA}, 0) |
424 from_jid = data['from'] | 426 from_jid = data['from'] |
425 to_jid = data['to'] | 427 to_jid = data['to'] |
426 d = self.dbpool.runQuery("INSERT INTO history(uid, update_uid, profile_id, source, dest, source_res, dest_res, timestamp, received_timestamp, type, extra) VALUES (?,?,?,?,?,?,?,?,?,?,?)", | 428 d = self.dbpool.runQuery("INSERT INTO history(uid, stanza_id, update_uid, profile_id, source, dest, source_res, dest_res, timestamp, received_timestamp, type, extra) VALUES (?,?,?,?,?,?,?,?,?,?,?,?)", |
427 (data['uid'], data['extra'].get('update_uid'), self.profiles[profile], data['from'].userhost(), to_jid.userhost(), from_jid.resource, to_jid.resource, data['timestamp'], data.get('received_timestamp'), data['type'], sqlite3.Binary(extra))) | 429 (data['uid'], data['extra'].get('stanza_id'), data['extra'].get('update_uid'), self.profiles[profile], data['from'].userhost(), to_jid.userhost(), from_jid.resource, to_jid.resource, data['timestamp'], data.get('received_timestamp'), data['type'], sqlite3.Binary(extra))) |
428 d.addCallbacks(self._addToHistoryCb, self._addToHistoryEb, callbackArgs=[data], errbackArgs=[data]) | 430 d.addCallbacks(self._addToHistoryCb, self._addToHistoryEb, callbackArgs=[data], errbackArgs=[data]) |
429 d.addErrback(self._logHistoryError, from_jid, to_jid, data) | 431 d.addErrback(self._logHistoryError, from_jid, to_jid, data) |
430 return d | 432 return d |
431 | 433 |
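The widened INSERT above pulls the stanza id out of data['extra'] into its own column; a sketch of the kind of message dict it now expects (values are invented, keys match the ones read by the query):

from twisted.words.protocols.jabber import jid

# Illustrative message data for addToHistory; only the keys used by the
# INSERT above are shown.  The stanza_id travels inside 'extra' and ends up
# in the dedicated column (and is excluded from the pickled extra blob via
# NOT_IN_EXTRA).
data = {
    'uid': u'some-unique-uid',                        # hypothetical values
    'from': jid.JID(u'romeo@montague.lit/balcony'),
    'to': jid.JID(u'juliet@capulet.lit'),
    'timestamp': 1543655297.0,
    'type': u'chat',
    'extra': {u'stanza_id': u'server-assigned-id'},   # e.g. from XEP-0359
}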
432 def sqliteHistoryToList(self, query_result): | 434 def sqliteHistoryToList(self, query_result): |
433 """Get SQL query result and return a list of message data dicts""" | 435 """Get SQL query result and return a list of message data dicts""" |
434 result = [] | 436 result = [] |
435 current = {'uid': None} | 437 current = {'uid': None} |
436 for row in reversed(query_result): | 438 for row in reversed(query_result): |
437 uid, update_uid, source, dest, source_res, dest_res, timestamp, received_timestamp,\ | 439 uid, stanza_id, update_uid, source, dest, source_res, dest_res, timestamp, received_timestamp,\ |
438 type_, extra, message, message_lang, subject, subject_lang, thread, thread_parent = row | 440 type_, extra, message, message_lang, subject, subject_lang, thread, thread_parent = row |
439 if uid != current['uid']: | 441 if uid != current['uid']: |
440 # new message | 442 # new message |
441 try: | 443 try: |
442 extra = pickle.loads(str(extra or "")) | 444 extra = pickle.loads(str(extra or "")) |
450 'subject': {}, | 452 'subject': {}, |
451 'type': type_, | 453 'type': type_, |
452 'extra': extra, | 454 'extra': extra, |
453 'timestamp': timestamp, | 455 'timestamp': timestamp, |
454 } | 456 } |
457 if stanza_id is not None: | |
458 current['extra']['stanza_id'] = stanza_id | |
455 if update_uid is not None: | 459 if update_uid is not None: |
456 current['extra']['update_uid'] = update_uid | 460 current['extra']['update_uid'] = update_uid |
457 if received_timestamp is not None: | 461 if received_timestamp is not None: |
458 current['extra']['received_timestamp'] = str(received_timestamp) | 462 current['extra']['received_timestamp'] = str(received_timestamp) |
459 result.append(current) | 463 result.append(current) |
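On the way back out, sqliteHistoryToList mirrors this: a non-NULL stanza_id column is put back under extra; roughly the entry shape produced for one message (only keys visible in this hunk are listed, values invented):

# Illustrative result entry; stanza_id and received_timestamp are restored
# into 'extra' from their dedicated columns.
entry = {
    'uid': u'some-unique-uid',
    'subject': {},
    'type': u'chat',
    'timestamp': 1543655297.0,
    'extra': {
        u'stanza_id': u'server-assigned-id',
        u'received_timestamp': u'1543655298.0',
    },
}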
490 @param to_jid (JID): dest JID (full, or bare for catchall) | 494 @param to_jid (JID): dest JID (full, or bare for catchall) |
491 @param limit (int): maximum number of messages to get: | 495 @param limit (int): maximum number of messages to get: |
492 - 0 for no message (returns the empty list) | 496 - 0 for no message (returns the empty list) |
493 - None for unlimited | 497 - None for unlimited |
494 @param between (bool): confound source and dest (ignore the direction) | 498 @param between (bool): confound source and dest (ignore the direction) |
495 @param search (unicode): pattern to filter the history results | 499 @param filters (dict[unicode, unicode]): pattern to filter the history results |
496 @param profile (unicode): %(doc_profile)s | 500 @param profile (unicode): %(doc_profile)s |
497 @return: list of tuple as in [messageNew] | 501 @return: list of tuple as in [messageNew] |
498 """ | 502 """ |
499 assert profile | 503 assert profile |
500 if filters is None: | 504 if filters is None: |
501 filters = {} | 505 filters = {} |
502 if limit == 0: | 506 if limit == 0: |
503 return defer.succeed([]) | 507 return defer.succeed([]) |
504 | 508 |
505 query_parts = [u"SELECT uid, update_uid, source, dest, source_res, dest_res, timestamp, received_timestamp,\ | 509 query_parts = [u"SELECT uid, stanza_id, update_uid, source, dest, source_res, dest_res, timestamp, received_timestamp,\ |
506 type, extra, message, message.language, subject, subject.language, thread_id, thread.parent_id\ | 510 type, extra, message, message.language, subject, subject.language, thread_id, thread.parent_id\ |
507 FROM history LEFT JOIN message ON history.uid = message.history_uid\ | 511 FROM history LEFT JOIN message ON history.uid = message.history_uid\ |
508 LEFT JOIN subject ON history.uid=subject.history_uid\ | 512 LEFT JOIN subject ON history.uid=subject.history_uid\ |
509 LEFT JOIN thread ON history.uid=thread.history_uid\ | 513 LEFT JOIN thread ON history.uid=thread.history_uid\ |
510 WHERE profile_id=? AND"] # FIXME: not sure if it's the best request, messages and subjects can appear several times here | 514 WHERE profile_id=?"] # FIXME: not sure if it's the best request, messages and subjects can appear several times here |
511 values = [self.profiles[profile]] | 515 values = [self.profiles[profile]] |
512 | 516 |
513 def test_jid(type_, _jid): | 517 def test_jid(type_, jid_): |
514 values.append(_jid.userhost()) | 518 values.append(jid_.userhost()) |
515 if _jid.resource: | 519 if jid_.resource: |
516 values.append(_jid.resource) | 520 values.append(jid_.resource) |
517 return u'(%s=? AND %s_res=?)' % (type_, type_) | 521 return u'({type_}=? AND {type_}_res=?)'.format(type_=type_) |
518 return u'%s=?' % (type_, ) | 522 return u'{type_}=?'.format(type_=type_) |
519 | 523 |
520 if between: | 524 if not from_jid and not to_jid: |
521 query_parts.append(u"((%s AND %s) OR (%s AND %s))" % (test_jid('source', from_jid), | 525 # not jid specified, we want all one2one communications |
522 test_jid('dest', to_jid), | 526 pass |
523 test_jid('source', to_jid), | 527 elif between: |
524 test_jid('dest', from_jid))) | 528 if not from_jid or not to_jid: |
529 # we only have one jid specified, we check all messages | |
530 # from or to this jid | |
531 jid_ = from_jid or to_jid | |
532 query_parts.append(u"AND ({source} OR {dest})".format( | |
533 source=test_jid(u'source', jid_), | |
534 dest=test_jid(u'dest' , jid_))) | |
535 else: | |
536 # we have 2 jids specified, we check all communications between | |
537 # those 2 jids | |
538 query_parts.append( | |
539 u"AND (({source_from} AND {dest_to}) " | |
540 u"OR ({source_to} AND {dest_from}))".format( | |
541 source_from=test_jid('source', from_jid), | |
542 dest_to=test_jid('dest', to_jid), | |
543 source_to=test_jid('source', to_jid), | |
544 dest_from=test_jid('dest', from_jid))) | |
525 else: | 545 else: |
526 query_parts.append(u"%s AND %s" % (test_jid('source', from_jid), | 546 # we want one communication in specific direction (from somebody or |
527 test_jid('dest', to_jid))) | 547 # to somebody). |
548 q = [] | |
549 if from_jid is not None: | |
550 q.append(test_jid('source', from_jid)) | |
551 if to_jid is not None: | |
552 q.append(test_jid('dest', to_jid)) | |
553 query_parts.append(u"AND " + u" AND ".join(q)) | |
554 | |
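Depending on which JIDs are given and on between, the reworked branches above append one of a few WHERE fragments; reconstructed by hand (bare JIDs assumed, so each test_jid call yields a single source=? or dest=? test):

# Reconstructed fragments appended to query_parts by the branches above.
WHERE_FRAGMENTS = {
    u'no jid given': u'',  # nothing appended: all one2one history of the profile
    u'between, one jid': u'AND (source=? OR dest=?)',
    u'between, both jids': u'AND ((source=? AND dest=?) OR (source=? AND dest=?))',
    u'directional, both jids': u'AND source=? AND dest=?',
}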
555 # set to True if "ORDER BY" is already added | |
556 order = False | |
528 | 557 |
529 if filters: | 558 if filters: |
530 if 'body' in filters: | 559 if 'body' in filters: |
531 # TODO: use REGEXP (function to be defined) instead of GLOB: https://www.sqlite.org/lang_expr.html | 560 # TODO: use REGEXP (function to be defined) instead of GLOB: https://www.sqlite.org/lang_expr.html |
532 query_parts.append(u"AND message LIKE ?") | 561 query_parts.append(u"AND message LIKE ?") |
540 values.extend(types) | 569 values.extend(types) |
541 if 'not_types' in filters: | 570 if 'not_types' in filters: |
542 types = filters['not_types'].split() | 571 types = filters['not_types'].split() |
543 query_parts.append(u"AND type NOT IN ({})".format(u','.join("?"*len(types)))) | 572 query_parts.append(u"AND type NOT IN ({})".format(u','.join("?"*len(types)))) |
544 values.extend(types) | 573 values.extend(types) |
545 | 574 if 'last_stanza_id' in filters: |
546 | 575 # this request get the last message with a "stanza_id" that we |
547 query_parts.append(u"ORDER BY timestamp DESC") # we reverse the order in sqliteHistoryToList | 576 # have in history. This is mainly used to retrieve messages sent |
548 # we use DESC here so LIMIT keep the last messages | 577 # while we were offline, using MAM (XEP-0313). |
578 if (filters[u'last_stanza_id'] is not True | |
579 or from_jid is not None or to_jid is not None | |
580 or limit != 1): | |
581 raise ValueError(u"Unexpected values for last_stanza_id filter") | |
582 query_parts.append(u"AND stanza_id IS NOT NULL ORDER BY history.rowid DESC") | |
583 order = True | |
584 | |
585 if not order: | |
586 query_parts.append(u"ORDER BY timestamp DESC") # we reverse the order in sqliteHistoryToList | |
587 # we use DESC here so LIMIT keep the last messages | |
549 if limit is not None: | 588 if limit is not None: |
550 query_parts.append(u"LIMIT ?") | 589 query_parts.append(u"LIMIT ?") |
551 values.append(limit) | 590 values.append(limit) |
552 | 591 |
553 d = self.dbpool.runQuery(u" ".join(query_parts), values) | 592 d = self.dbpool.runQuery(u" ".join(query_parts), values) |
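Putting the getHistory pieces together for the last_stanza_id case, the query handed to runQuery should come out roughly as below (reconstructed from the query_parts above; whitespace in the real query differs):

# Approximate query for filters={u'last_stanza_id': True}, limit=1, no JIDs.
LAST_STANZA_ID_QUERY = (
    u"SELECT uid, stanza_id, update_uid, source, dest, source_res, dest_res,"
    u" timestamp, received_timestamp, type, extra, message, message.language,"
    u" subject, subject.language, thread_id, thread.parent_id"
    u" FROM history LEFT JOIN message ON history.uid = message.history_uid"
    u" LEFT JOIN subject ON history.uid=subject.history_uid"
    u" LEFT JOIN thread ON history.uid=thread.history_uid"
    u" WHERE profile_id=?"
    u" AND stanza_id IS NOT NULL ORDER BY history.rowid DESC"
    u" LIMIT ?"
)
# with values = [<profile_id>, 1]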