New module: ddg: search the Internet through DuckDuckGo and Wolfram|Alpha
This commit is contained in:
parent
cf18e7c2e7
commit
16f6cefc59
3 changed files with 187 additions and 0 deletions
68
modules/ddg/DDGSearch.py
Normal file
68
modules/ddg/DDGSearch.py
Normal file
|
|
@ -0,0 +1,68 @@
|
|||
# coding=utf-8
|
||||
|
||||
import http.client
|
||||
import re
|
||||
from urllib.parse import quote
|
||||
|
||||
import module_states_file as xmlparser
|
||||
|
||||
class DDGSearch:
    """One DuckDuckGo query and a cursor over the results it produced.

    The constructor fetches the XML answer for ``terms`` through
    ``getPage`` and parses it with ``xmlparser.parse_string``.  When the
    request does not come back with ``http.client.OK`` no document is
    kept (``ddgres`` is ``None``) and every accessor degrades to its
    "nothing found" value instead of raising.
    """

    def __init__(self, terms):
        """Run the search for *terms* and store the parsed response."""
        self.terms = terms
        # Cursor over the results already handed out; -1 means "none yet".
        self.curRT = -1
        (res, page) = getPage(terms)
        if res == http.client.OK:
            self.ddgres = xmlparser.parse_string(page)
        else:
            self.ddgres = None

    @property
    def type(self):
        """Content of the response's ``Type`` node, or ``None`` without a response."""
        if self.ddgres is None:
            return None
        return self.ddgres.getFirstNode("Type").getContent()

    @property
    def definition(self):
        """Content of the ``Definition`` node, or an apology message if absent."""
        if self.ddgres is not None and self.ddgres.hasNode("Definition"):
            return self.ddgres.getFirstNode("Definition").getContent()
        return "Sorry, no definition found for %s" % self.terms

    def _related_topics(self):
        """Return the list of ``RelatedTopic`` nodes, empty when there are none."""
        if self.ddgres is None or not self.ddgres.hasNode("RelatedTopics"):
            return []
        return self.ddgres.getFirstNode("RelatedTopics").getNodes("RelatedTopic")

    @property
    def nextRes(self):
        """Return the next result text, advancing the internal cursor.

        Each access consumes one result; once nothing is left (or when
        there is no response at all) the string ``"No more results"`` is
        returned.  The source used depends on the response:

        * type ``"D"`` (presumably DuckDuckGo's disambiguation type --
          TODO confirm): the related topics, one per access;
        * an ``Answer`` node: its content with HTML tags stripped, once;
        * a non-empty ``Abstract`` node: the abstract followed by its
          URL in angle brackets, once;
        * otherwise: the related topics, one per access.
        """
        if self.ddgres is None:
            return "No more results"

        if self.type == "D":
            topics = self._related_topics()
            if len(topics) > self.curRT + 1:
                self.curRT += 1
                return topics[self.curRT].getFirstNode("Text").getContent()
        elif self.ddgres.hasNode("Answer"):
            if self.curRT < 0:
                self.curRT = 0
                return striphtml(self.ddgres.getFirstNode("Answer").getContent())
        elif (self.ddgres.hasNode("Abstract")
                and len(self.ddgres.getNode("Abstract").getContent()) > 0):
            if self.curRT < 0:
                self.curRT = 0
                return (self.ddgres.getNode("Abstract").getContent()
                        + " <" + self.ddgres.getNode("AbstractURL").getContent() + ">")
        else:
            topics = self._related_topics()
            # The cursor starts at -1; clamp it so the first access reads
            # topic 0 rather than indexing the list from its end.
            index = max(self.curRT, 0)
            if len(topics) > index:
                self.curRT = index + 1
                return topics[index].getFirstNode("Text").getContent()

        return "No more results"
|
||||
|
||||
|
||||
def striphtml(data):
    """Return *data* with every ``<...>`` span removed.

    The pattern is non-greedy, so each span ends at the first ``>``
    following its ``<``; text outside such spans is left untouched.
    """
    return re.sub(r'<.*?>', '', data)
|
||||
|
||||
def getPage(terms):
    """Fetch the DuckDuckGo XML answer for *terms*.

    Sends ``GET /?q=<quoted terms>&format=xml`` to ``api.duckduckgo.com``
    over plain HTTP.

    Returns a ``(status, body)`` tuple: the HTTP status of the response
    and the body as returned by ``HTTPResponse.read()``.  When the host
    name cannot be resolved, a message is printed and
    ``(http.client.INTERNAL_SERVER_ERROR, None)`` is returned instead.
    """
    # Imported here so the handler below does not depend on a top-level
    # ``socket`` import being present in the module.
    import socket

    conn = http.client.HTTPConnection("api.duckduckgo.com")
    try:
        conn.request("GET", "/?q=%s&format=xml" % quote(terms))
        res = conn.getresponse()
        data = res.read()
    except socket.gaierror:
        print("impossible de récupérer la page %s." % terms)
        return (http.client.INTERNAL_SERVER_ERROR, None)
    finally:
        # Release the connection on the success and failure paths alike.
        conn.close()

    return (res.status, data)
|
||||
Loading…
Add table
Add a link
Reference in a new issue