f14160403f3f067b9f8d0f080d847fd27138c9f6
[zzz-dywypi.git] / plugins / WWWJDIC / plugin.py
1 ###
2 # Copyright (c) 2010, Alex Munroe
3 # All rights reserved.
4 #
5 # Redistribution and use in source and binary forms, with or without
6 # modification, are permitted provided that the following conditions are met:
7 #
8 # * Redistributions of source code must retain the above copyright notice,
9 # this list of conditions, and the following disclaimer.
10 # * Redistributions in binary form must reproduce the above copyright notice,
11 # this list of conditions, and the following disclaimer in the
12 # documentation and/or other materials provided with the distribution.
13 # * Neither the name of the author of this software nor the name of
14 # contributors to this software may be used to endorse or promote products
15 # derived from this software without specific prior written consent.
16 #
17 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 # ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 # LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 # POSSIBILITY OF SUCH DAMAGE.
28
29 ###
30
31 import supybot.utils as utils
32 from supybot.commands import *
33 import supybot.plugins as plugins
34 import supybot.ircutils as ircutils
35 import supybot.callbacks as callbacks
36
37 import urllib
38 import urllib2
39 from BeautifulSoup import BeautifulSoup, NavigableString
40
41
class WWWJDIC(callbacks.Plugin):
    """Looks up Japanese words in the WWWJDIC online dictionary (EDICT).

    Provides the "jdic" command, which sends a query to the WWWJDIC server
    and replies with the first few matching dictionary entries."""
    threaded = True

    # Raw-results endpoint.  The query-string flags mean:
    # 1 = edict; Z = raw results; U = utf8 input; R = exact + common
    _BASE_URL = u"http://www.csse.monash.edu.au/~jwb/cgi-bin/wwwjdic.cgi?1ZUR"

    # Don't send back more than three entries; that's probably plenty.
    _MAX_ENTRIES = 3

    def jdic(self, irc, msg, args, thing):
        """<thing...>

        Looks up <thing> in the EDICT Japanese dictionary.
        To use roomaji, prefix with @ for hiragana or # for katakana."""
        # NOTE: the docstring above is kept verbatim from the original,
        # since it is the user-facing help text for the command.

        # urllib doesn't understand unicode at all, so normalise the query
        # to unicode first, then manually encode it as UTF-8 bytes and
        # urlencode those.
        query = self._to_unicode(thing)
        url = self._BASE_URL + urllib.quote(query.encode('utf8'))

        # Always release the HTTP connection, even if parsing blows up.
        res = urllib2.urlopen(url)
        try:
            soup = BeautifulSoup(res)
        finally:
            res.close()

        sent = 0
        for entry in self._entries(soup):
            self._reply(irc, entry)
            sent += 1
            if sent >= self._MAX_ENTRIES:
                break

        # Tell the user explicitly when there was nothing to show, rather
        # than staying silent.
        if not sent:
            self._reply(irc, 'No results found.')

    jdic = wrap(jdic, [rest('something')])

    def _to_unicode(self, thing):
        """Returns `thing` as a unicode string.

        Byte strings are decoded as UTF-8, falling back to Latin-1 (which
        accepts any byte sequence) when they are not valid UTF-8.  Unicode
        input is returned unchanged.
        """
        if isinstance(thing, unicode):
            return thing
        try:
            return thing.decode('utf8')
        except UnicodeDecodeError:
            return thing.decode('latin1')

    def _entries(self, soup):
        """Returns the non-blank, stripped lines of the first <pre> in `soup`.

        Even the raw results come wrapped in minimal HTML, in this form:
            <pre>
            entry 1
            entry 2
        so everything inside that pre tag is split by lines.  Returns an
        empty list when the document contains no <pre> tag at all.
        """
        pre = soup.pre
        if pre is None:
            return []

        text = pre.string
        if text is None:
            # .string is None when <pre> has more than one child node;
            # fall back to joining every text node underneath it.
            text = u''.join(pre.findAll(text=True))

        stripped = (line.strip() for line in text.splitlines())
        return [line for line in stripped if line]

    def _reply(self, irc, response):
        """Wraps irc.reply() to do some Unicode encoding.

        Byte strings are passed through untouched; anything else (i.e.
        unicode) is encoded as UTF-8 before being handed to irc.reply().
        """
        if isinstance(response, str):
            irc.reply(response)
        else:
            irc.reply(response.encode('utf8'))
106
107
108
109
# Module-level alias for the plugin class defined above.
# NOTE(review): presumably this is the name the Supybot plugin loader looks
# up when loading the module -- confirm against the Supybot docs.
Class = WWWJDIC
111
112
113 # vim:set shiftwidth=4 softtabstop=4 expandtab textwidth=79: