Mercurial > libervia-backend
view src/plugins/plugin_exp_lang_detect.py @ 2316:7b448ac50a69
jp (pubsub): new search command:
search is a kind of "grep for Pubsub". It's a powerful command which allows looking for specific data in a pubsub node, recursing into sub nodes if requested, and executing an action on the result.
search allows looking for items with the following filters:
- simple text search
- regex
- xpath
- python code
filters are read and applied in the order in which they appear on the command line.
Then flags can be used to modify behaviour, currently there are:
- ignore-case to specify if search must be case sensitive or not
- invert to invert result of the search (i.e. don't match instead of match)
- dot-all which is specific for regex, cf. re module
- only-matching which returns the matching part instead of the full item
Once an item matches the filters, an action is applied to it; currently there are:
- print, which does a simple output of the full item (default)
- exec, which runs a jp command, specifying the service, node and item corresponding to the match
- external, which runs an external command, sending the full item on stdin
By default search is only done on requested node, but if max-depth is more than 0, sub nodes will be searched too.
author | Goffi <goffi@goffi.org> |
---|---|
date | Sat, 08 Jul 2017 21:54:24 +0200 |
parents | 33c8c4973743 |
children | 8b37a62336c3 |
line wrap: on
line source
#!/usr/bin/env python2
# -*- coding: utf-8 -*-

# SAT plugin to detect language (experimental)
# Copyright (C) 2009-2016 Jérôme Poisson (goffi@goffi.org)

# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.

# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.

# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.

from sat.core.i18n import _, D_
from sat.core.constants import Const as C
from sat.core.log import getLogger
log = getLogger(__name__)
from sat.core import exceptions

try:
    from langid.langid import LanguageIdentifier, model
except ImportError:
    raise exceptions.MissingModule(u'Missing module langid, please download/install it with "pip install langid"')

# Single shared classifier, built once at import time from langid's bundled model.
identifier = LanguageIdentifier.from_modelstring(model, norm_probs=False)


PLUGIN_INFO = {
    C.PI_NAME: "Language detection plugin",
    C.PI_IMPORT_NAME: "EXP-LANG-DETECT",
    C.PI_TYPE: "EXP",
    C.PI_PROTOCOLS: [],
    C.PI_DEPENDENCIES: [],
    C.PI_MAIN: "LangDetect",
    C.PI_HANDLER: "no",
    C.PI_DESCRIPTION: _("""Detect and set message language when unknown""")
}

CATEGORY = D_(u"Misc")
NAME = u"lang_detect"
LABEL = D_(u"language detection")
# Per-profile boolean parameter (enabled by default) which switches detection on/off.
PARAMS = """
    <params>
    <individual>
    <category name="{category_name}">
        <param name="{name}" label="{label}" type="bool" value="true" />
    </category>
    </individual>
    </params>
    """.format(category_name=CATEGORY,
               name=NAME,
               label=_(LABEL),
               )


class LangDetect(object):
    """Plugin setting the language of messages whose language is unknown."""

    def __init__(self, host):
        """Register the plugin parameter and the message triggers.

        @param host: host object; its ``memory`` and ``trigger`` attributes are used
            to declare PARAMS and to hook "MessageReceived" and "sendMessage"
        """
        log.info(_(u"Language detection plugin initialization"))
        self.host = host
        host.memory.updateParams(PARAMS)
        host.trigger.add("MessageReceived", self.MessageReceivedTrigger)
        host.trigger.add("sendMessage", self.MessageSendTrigger)

    def addLanguage(self, mess_data):
        """Detect the language of a message which has none, and set it.

        Detection only happens when ``mess_data['message']`` holds exactly one
        body, stored under the empty key ''. In that case the mapping is
        replaced by ``{detected_lang: body}``. In any other case the data is
        left untouched.

        @param mess_data(dict): message data, updated in place
        @return (dict): the same ``mess_data`` object
        """
        message = mess_data['message']
        # membership test + key lookup instead of indexing keys()/values():
        # same result, no temporary lists, and not tied to Python 2 list-returning dicts
        if len(message) == 1 and '' in message:
            msg = message['']
            # first element of the classify() result is used as the language
            lang = identifier.classify(msg)[0]
            mess_data["message"] = {lang: msg}
        return mess_data

    def MessageReceivedTrigger(self, client, message_elt, post_treat):
        """Schedule language detection for a received message.

        If the "lang_detect" parameter is set for the client's profile,
        addLanguage is added as a callback of ``post_treat``.

        @param client: client whose ``profile`` is used to read the parameter
        @param message_elt: received message element (not used here)
        @param post_treat: object on which addLanguage is registered with
            ``addCallback`` (presumably a Deferred -- to be confirmed)
        @return (bool): always True
        """
        lang_detect = self.host.memory.getParamA(NAME, CATEGORY, profile_key=client.profile)
        if lang_detect:
            post_treat.addCallback(self.addLanguage)
        return True

    def MessageSendTrigger(self, client, data, pre_xml_treatments, post_xml_treatments):
        """Detect the language of a message about to be sent.

        If the "lang_detect" parameter is set for the client's profile,
        addLanguage is applied immediately on ``data``.

        @param client: client whose ``profile`` is used to read the parameter
        @param data(dict): message data, updated in place by addLanguage
        @param pre_xml_treatments: not used here
        @param post_xml_treatments: not used here
        @return (bool): always True
        """
        lang_detect = self.host.memory.getParamA(NAME, CATEGORY, profile_key=client.profile)
        if lang_detect:
            self.addLanguage(data)
        return True