# HG changeset patch # User Goffi # Date 1664030266 -7200 # Node ID 4cb38c8312a10ca45ec70d162e41d00e8c990f64 # Parent 944f51f9c2b41354846847ee24ac3f4407492fbe plugin XEP-0384, xml_tools: avoid `getItems` timeout + fix empty node crash + parsing: - use `max_items` in `getItems` calls for bundles, as otherwise some pubsub service may return full nodes, which may be huge is `max_items=1` is not set on the node, possibly resulting in timeouts. - the plugin was crashing when TWOMEMO devices list node has no items at all. This is not the case anymore. - a naive parsing method has been implemented in `xml_tools` to replace the serialisation/deserialisation method. This should be more efficient and will avoid annoying `ns0:` prefixes in XML logs. diff -r 944f51f9c2b4 -r 4cb38c8312a1 sat/plugins/plugin_xep_0384.py --- a/sat/plugins/plugin_xep_0384.py Sat Sep 24 16:31:39 2022 +0200 +++ b/sat/plugins/plugin_xep_0384.py Sat Sep 24 16:37:46 2022 +0200 @@ -419,7 +419,7 @@ node = f"eu.siacs.conversations.axolotl.bundles:{device_id}" try: - items, __ = await xep_0060.getItems(client, jid.JID(bare_jid), node) + items, __ = await xep_0060.getItems(client, jid.JID(bare_jid), node, max_items=1) except Exception as e: raise omemo.BundleDownloadFailed( f"Bundle download failed for {bare_jid}: {device_id} under namespace" @@ -432,7 +432,7 @@ f" {namespace}: Unexpected number of items retrieved: {len(items)}." ) - element = next(iter(domish_to_etree(cast(domish.Element, items[0]))), None) + element = next(iter(xml_tools.domish_elt_2_et_elt(cast(domish.Element, items[0]))), None) if element is None: raise omemo.BundleDownloadFailed( f"Bundle download failed for {bare_jid}: {device_id} under namespace" @@ -476,7 +476,7 @@ client, client.jid.userhostJID(), node, - etree_to_domish(element), + xml_tools.et_elt_2_domish_elt(element), item_id=str(bundle.device_id), extra={ xep_0060.EXTRA_PUBLISH_OPTIONS: { @@ -516,7 +516,7 @@ client, client.jid.userhostJID(), node, - etree_to_domish(element), + xml_tools.et_elt_2_domish_elt(element), item_id=xep_0060.ID_SINGLETON, extra={ xep_0060.EXTRA_PUBLISH_OPTIONS: { xep_0060.OPT_MAX_ITEMS: 1 }, @@ -563,7 +563,7 @@ ) element = next( - iter(domish_to_etree(cast(domish.Element, items[0]))), + iter(xml_tools.domish_elt_2_et_elt(cast(domish.Element, items[0]))), None ) if element is None: @@ -650,7 +650,7 @@ client, client.jid.userhostJID(), node, - etree_to_domish(element), + xml_tools.et_elt_2_domish_elt(element), item_id=xep_0060.ID_SINGLETON, extra={ xep_0060.EXTRA_PUBLISH_OPTIONS: { @@ -705,13 +705,15 @@ f" {namespace}" ) from e - if len(items) != 1: + if len(items) == 0: + return {} + elif len(items) != 1: raise omemo.DeviceListDownloadFailed( f"Device list download failed for {bare_jid} under namespace" f" {namespace}: Unexpected number of items retrieved: {len(items)}." ) - element = next(iter(domish_to_etree(cast(domish.Element, items[0]))), None) + element = next(iter(xml_tools.domish_elt_2_et_elt(cast(domish.Element, items[0]))), None) if element is None: raise omemo.DeviceListDownloadFailed( f"Device list download failed for {bare_jid} under namespace" @@ -866,10 +868,10 @@ "timestamp": time.time() })) - message_data["xml"].addChild(etree_to_domish(element)) + message_data["xml"].addChild(xml_tools.et_elt_2_domish_elt(element)) try: - await client.send(message_data["xml"]) + await client.a_send(message_data["xml"]) except Exception as e: raise omemo.MessageSendingFailed() from e @@ -1493,7 +1495,6 @@ encrypted. @return: Whether to continue the message received flow. """ - muc_plaintext_cache_key: Optional[MUCPlaintextCacheKey] = None sender_jid = jid.JID(message_elt["from"]) @@ -1583,7 +1584,7 @@ if twomemo_encrypted_elt is not None: try: message = twomemo.etree.parse_message( - domish_to_etree(twomemo_encrypted_elt), + xml_tools.domish_elt_2_et_elt(twomemo_encrypted_elt), sender_bare_jid ) except (ValueError, XMLSchemaValidationError): @@ -1597,7 +1598,7 @@ if oldmemo_encrypted_elt is not None: try: message = await oldmemo.etree.parse_message( - domish_to_etree(oldmemo_encrypted_elt), + xml_tools.domish_elt_2_et_elt(oldmemo_encrypted_elt), sender_bare_jid, client.jid.userhost(), session_manager @@ -1999,11 +2000,11 @@ if namespace == twomemo.twomemo.NAMESPACE: # Add the encrypted element - stanza.addChild(etree_to_domish(twomemo.etree.serialize_message(message))) + stanza.addChild(xml_tools.et_elt_2_domish_elt(twomemo.etree.serialize_message(message))) if namespace == oldmemo.oldmemo.NAMESPACE: # Add the encrypted element - stanza.addChild(etree_to_domish(oldmemo.etree.serialize_message(message))) + stanza.addChild(xml_tools.et_elt_2_domish_elt(oldmemo.etree.serialize_message(message))) if muc_plaintext_cache_key is not None: self.__muc_plaintext_cache[muc_plaintext_cache_key] = plaintext @@ -2031,7 +2032,7 @@ log.debug("Ignoring empty device list update.") return - item_elt = domish_to_etree(item) + item_elt = xml_tools.domish_elt_2_et_elt(item) device_list: Dict[int, Optional[str]] = {} namespace: Optional[str] = None diff -r 944f51f9c2b4 -r 4cb38c8312a1 sat/tools/xml_tools.py --- a/sat/tools/xml_tools.py Sat Sep 24 16:31:39 2022 +0200 +++ b/sat/tools/xml_tools.py Sat Sep 24 16:37:46 2022 +0200 @@ -18,7 +18,7 @@ import re -from typing import Optional +from typing import Optional, Tuple import html.entities from collections import OrderedDict from xml.dom import minidom, NotFoundErr @@ -30,6 +30,7 @@ from sat.core.i18n import _ from sat.core.constants import Const as C from sat.core.log import getLogger +import xml.etree.ElementTree as ET log = getLogger(__name__) @@ -1957,3 +1958,55 @@ def ppElt(elt): """Pretty print a domish.Element""" print(pFmtElt(elt)) + + +# ElementTree + +def et_get_namespace_and_name(et_elt: ET.Element) -> Tuple[Optional[str], str]: + """Retrieve element namespace and name from ElementTree element + + @param et_elt: ElementTree element + @return: namespace and name of the element + if not namespace if specified, None is returned + """ + name = et_elt.tag + if not name: + raise ValueError("no name set in ET element") + elif name[0] != "{": + return None, name + end_idx = name.find("}") + if end_idx == -1: + raise ValueError("Invalid ET name") + return name[1:end_idx], name[end_idx+1:] + + +def et_elt_2_domish_elt(et_elt: ET.Element) -> domish.Element: + """Convert ElementTree element to Twisted's domish.Element + + Note: this is a naive implementation, adapted to XMPP, and some content are ignored + (attributes namespaces, tail) + """ + namespace, name = et_get_namespace_and_name(et_elt) + elt = domish.Element((namespace, name), attribs=et_elt.attrib) + if et_elt.text: + elt.addContent(et_elt.text) + for child in et_elt: + elt.addChild(et_elt_2_domish_elt(child)) + return elt + + +def domish_elt_2_et_elt(elt: domish.Element) -> ET.Element: + """Convert Twisted's domish.Element to ElementTree equivalent + + Note: this is a naive implementation, adapter to XMPP, and some text content may be + missing (content put after a tag, i.e. what would go to the "tail" attribute of ET + Element) + """ + tag = f"{{{elt.uri}}}{elt.name}" if elt.uri else elt.name + et_elt = ET.Element(tag, attrib=elt.attributes) + content = str(elt) + if content: + et_elt.text = str(elt) + for child in elt.elements(): + et_elt.append(domish_elt_2_et_elt(child)) + return et_elt