2012-06-30 15:51:50 +00:00
|
|
|
# coding=utf-8
|
|
|
|
|
2014-10-04 05:33:34 +00:00
|
|
|
"""Find synonyms"""
|
2014-08-27 23:39:31 +00:00
|
|
|
|
2012-06-30 15:51:50 +00:00
|
|
|
import re
|
|
|
|
from urllib.parse import quote
|
|
|
|
|
2015-01-04 22:57:09 +00:00
|
|
|
from nemubot.exception import IRCException
|
2015-01-03 19:34:44 +00:00
|
|
|
from nemubot.hooks import hook
|
|
|
|
from nemubot.tools import web
|
2012-11-04 15:26:20 +00:00
|
|
|
|
2015-06-03 20:07:06 +00:00
|
|
|
nemubotversion = 4.0
|
2012-06-30 15:51:50 +00:00
|
|
|
|
2014-09-26 16:00:22 +00:00
|
|
|
from more import Response
|
|
|
|
|
2014-12-17 06:32:34 +00:00
|
|
|
|
2014-08-12 18:10:19 +00:00
|
|
|
def help_full():
|
2014-10-04 05:33:34 +00:00
|
|
|
return "!syno [LANG] <word>: give a list of synonyms for <word>."
|
2012-06-30 15:51:50 +00:00
|
|
|
|
2014-12-17 06:32:34 +00:00
|
|
|
|
2014-10-04 05:33:34 +00:00
|
|
|
def load(context):
|
|
|
|
global lang_binding
|
2014-07-25 13:12:37 +00:00
|
|
|
|
2015-06-03 20:07:06 +00:00
|
|
|
if not context.config or not context.config.hasAttribute("bighugelabskey"):
|
|
|
|
logger.error("You need a NigHugeLabs API key in order to have english "
|
|
|
|
"theasorus. Add it to the module configuration file:\n"
|
|
|
|
"<module name=\"syno\" bighugelabskey=\"XXXXXXXXXXXXXXXX\""
|
|
|
|
" />\nRegister at https://words.bighugelabs.com/getkey.php")
|
2014-07-25 13:12:37 +00:00
|
|
|
else:
|
2015-06-03 20:07:06 +00:00
|
|
|
lang_binding["en"] = lambda word: get_english_synos(context.config["bighugelabskey"], word)
|
2012-08-16 03:24:56 +00:00
|
|
|
|
|
|
|
|
2014-10-04 05:33:34 +00:00
|
|
|
def get_french_synos(word):
|
2013-03-20 14:08:24 +00:00
|
|
|
url = "http://www.crisco.unicaen.fr/des/synonymes/" + quote(word.encode("ISO-8859-1"))
|
|
|
|
page = web.getURLContent(url)
|
2014-07-25 13:12:37 +00:00
|
|
|
|
2014-10-04 05:33:34 +00:00
|
|
|
best = list(); synos = list(); anton = list()
|
|
|
|
|
2012-11-04 15:26:20 +00:00
|
|
|
if page is not None:
|
2014-07-08 00:44:20 +00:00
|
|
|
for line in page.split("\n"):
|
2014-07-25 13:12:37 +00:00
|
|
|
|
|
|
|
if line.find("!-- Fin liste des antonymes --") > 0:
|
|
|
|
for elt in re.finditer(">([^<>]+)</a>", line):
|
|
|
|
anton.append(elt.group(1))
|
|
|
|
|
|
|
|
elif line.find("!--Fin liste des synonymes--") > 0:
|
|
|
|
for elt in re.finditer(">([^<>]+)</a>", line):
|
2012-08-16 03:24:56 +00:00
|
|
|
synos.append(elt.group(1))
|
2014-07-25 13:12:37 +00:00
|
|
|
|
|
|
|
elif re.match("[ \t]*<tr[^>]*>.*</tr>[ \t]*</table>.*", line) is not None:
|
|
|
|
for elt in re.finditer(">&[^;]+;([^&]*)&[^;]+;<", line):
|
|
|
|
best.append(elt.group(1))
|
|
|
|
|
2014-10-04 05:33:34 +00:00
|
|
|
return (best, synos, anton)
|
|
|
|
|
|
|
|
|
|
|
|
def get_english_synos(key, word):
|
2014-12-17 06:32:34 +00:00
|
|
|
cnt = web.getJSON("http://words.bighugelabs.com/api/2/%s/%s/json" %
|
|
|
|
(quote(key), quote(word.encode("ISO-8859-1"))))
|
2014-10-04 05:33:34 +00:00
|
|
|
|
|
|
|
best = list(); synos = list(); anton = list()
|
|
|
|
|
|
|
|
if cnt is not None:
|
|
|
|
for k, c in cnt.items():
|
|
|
|
if "syn" in c: best += c["syn"]
|
|
|
|
if "rel" in c: synos += c["rel"]
|
|
|
|
if "ant" in c: anton += c["ant"]
|
2014-07-25 13:12:37 +00:00
|
|
|
|
2014-10-04 05:33:34 +00:00
|
|
|
return (best, synos, anton)
|
|
|
|
|
|
|
|
|
|
|
|
lang_binding = { 'fr': get_french_synos }
|
|
|
|
|
|
|
|
|
|
|
|
@hook("cmd_hook", "synonymes", data="synonymes")
|
|
|
|
@hook("cmd_hook", "antonymes", data="antonymes")
|
|
|
|
def go(msg, what):
|
2015-06-03 20:07:06 +00:00
|
|
|
if not len(msg.args):
|
2014-10-04 05:33:34 +00:00
|
|
|
raise IRCException("de quel mot veux-tu connaître la liste des synonymes ?")
|
|
|
|
|
|
|
|
# Detect lang
|
2015-06-03 20:07:06 +00:00
|
|
|
if msg.args[0] in lang_binding:
|
|
|
|
func = lang_binding[msg.args[0]]
|
|
|
|
word = ' '.join(msg.args[1:])
|
2012-08-16 03:24:56 +00:00
|
|
|
else:
|
2014-10-04 05:33:34 +00:00
|
|
|
func = lang_binding["fr"]
|
2015-06-03 20:07:06 +00:00
|
|
|
word = ' '.join(msg.args)
|
2014-10-04 05:33:34 +00:00
|
|
|
# TODO: depreciate usage without lang
|
2015-06-03 20:07:06 +00:00
|
|
|
#raise IRCException("language %s is not handled yet." % msg.args[0])
|
2014-10-04 05:33:34 +00:00
|
|
|
|
|
|
|
try:
|
|
|
|
best, synos, anton = func(word)
|
|
|
|
except:
|
|
|
|
best, synos, anton = (list(), list(), list())
|
|
|
|
|
|
|
|
if what == "synonymes":
|
|
|
|
if len(synos) > 0 or len(best) > 0:
|
|
|
|
res = Response(channel=msg.channel, title="Synonymes de %s" % word)
|
|
|
|
if len(best) > 0: res.append_message(best)
|
|
|
|
if len(synos) > 0: res.append_message(synos)
|
|
|
|
return res
|
|
|
|
else:
|
|
|
|
raise IRCException("Aucun synonyme de %s n'a été trouvé" % word)
|
|
|
|
|
|
|
|
elif what == "antonymes":
|
|
|
|
if len(anton) > 0:
|
|
|
|
res = Response(anton, channel=msg.channel,
|
|
|
|
title="Antonymes de %s" % word)
|
|
|
|
return res
|
|
|
|
else:
|
|
|
|
raise IRCException("Aucun antonyme de %s n'a été trouvé" % word)
|
|
|
|
|
|
|
|
else:
|
|
|
|
raise IRCException("WHAT?!")
|