summaryrefslogtreecommitdiff
path: root/ircbot.py
blob: 07f6ff3de6f54b5df260fe3943ff8620335d3808 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
#!/usr/bin/env python2

import logging
import sys
import importlib

from irc.client import SimpleIRCClient

import numpy
import theano
from theano import tensor

from blocks.model import Model

import datastream
from paramsaveload import SaveLoadParams
from blocks.graph import ComputationGraph

import random

logging.basicConfig(level='INFO')
logger = logging.getLogger(__name__)


class IRCClient(SimpleIRCClient):
    """IRC bot that answers channel messages by sampling from a sequence model.

    One pair of compiled Theano functions is kept per channel (plus one for
    the empty channel name ''), each with its own shared state variables, so
    the recurrent state of one channel is never mixed with another's.

    This file targets Python 2 (see the shebang): incoming text is encoded to
    UTF-8 byte strings and handled one byte at a time with ``ord``/``chr``.
    """

    def __init__(self, model, sample_temperature, server, port, nick, channels, saveload):
        """Compile the per-channel prediction functions.

        model              -- object exposing ``out`` (indexed as a rank-3
                              tensor here) and ``states``, an iterable of
                              ``(state_variable, updated_state)`` pairs.
        sample_temperature -- divisor applied to the last-step output before
                              the softmax.
        server, port       -- accepted for interface compatibility; not used
                              here (the caller passes them to ``connect``).
        nick               -- the bot's nickname; messages containing it may
                              trigger a reply.
        channels           -- list of channel names to serve and join.
        saveload           -- parameter save/load helper, stored as-is.
        """
        super(IRCClient, self).__init__()

        # Distribution over the next symbol, taken from the last position of
        # the second axis (presumably the time axis -- TODO confirm).
        out = model.out[:, -1, :] / numpy.float32(sample_temperature)
        prob = tensor.nnet.softmax(out)

        # The graph must depend on exactly one input, named 'bytes'.
        cg = ComputationGraph([prob])
        assert len(cg.inputs) == 1
        assert cg.inputs[0].name == 'bytes'

        # channel functions & state
        chfun = {}
        for ch in channels + ['']:
            logger.info("Building theano function for channel '%s'", ch)
            # One zero-initialised shared variable per model state, built
            # from a single-row slice of the state (presumably a batch of
            # one -- TODO confirm).
            state_vars = [theano.shared(state[0:1, :].zeros_like().eval(),
                                        state.name + '-' + ch)
                          for state, _ in model.states]
            # Read the state from the shared variable ...
            givens = [(state, shared)
                      for (state, _), shared in zip(model.states, state_vars)]
            # ... and write the new state back after every call.
            updates = [(shared, new_state)
                       for shared, (_, new_state) in zip(state_vars, model.states)]

            pred = theano.function(inputs=cg.inputs, outputs=[prob],
                                   givens=givens, updates=updates)
            reset_states = theano.function(
                inputs=[], outputs=[],
                updates=[(shared, shared.zeros_like()) for shared in state_vars])
            chfun[ch] = (pred, reset_states)

        self.saveload = saveload

        # channel name -> (predict function, reset-state function)
        self.chfuns = chfun

        # Use the constructor argument. The previous code read a module-level
        # name `chans`, which only exists when this file is run as a script.
        self.chans = channels
        self.nick = nick
        # Connection object; filled in by on_join.
        self.server = None

    def on_welcome(self, server, ev):
        """Join every configured channel whose name starts with '#'."""
        logger.info("Welcomed to " + repr(server))
        for ch in self.chans:
            if ch.startswith('#'):
                server.join(ch)

    def on_join(self, server, ev):
        """Remember the connection so that privmsg can send through it."""
        self.server = server

    def str2data(self, s):
        """Convert a byte string into a (1, len(s)) int16 array of byte values."""
        return numpy.array([ord(x) for x in s], dtype='int16')[None, :]

    def pred_until(self, pred_f, prob, delim='\n', forbid_first=None):
        """Sample symbols one at a time until `delim` is produced.

        pred_f       -- compiled prediction function; it is called with each
                        sampled symbol and returns the next distribution.
        prob         -- initial distribution; row 0 is sampled from.
        delim        -- single character that ends the sampling.
        forbid_first -- optional byte value that is rejected (and resampled)
                        as the very first symbol.

        Returns the sampled string without the trailing delimiter. Every
        accepted symbol, including the delimiter, is fed to `pred_f`.
        """
        chars = []
        while True:
            # Shrink the probabilities slightly before sampling; presumably
            # this keeps their float32 sum from exceeding 1, which
            # numpy.random.multinomial rejects -- TODO confirm.
            prob = prob / 1.00001
            pred = numpy.random.multinomial(1, prob[0, :]).nonzero()[0][0].astype('int16')
            if forbid_first is not None and not chars and int(pred) == forbid_first:
                continue  # try again

            ch = chr(int(pred))
            chars.append(ch)

            prob, = pred_f(pred[None, None])

            if ch == delim:
                break
        return ''.join(chars[:-1])

    def privmsg(self, chan, msg):
        """Send `msg` to `chan`; messages longer than 500 bytes are replaced."""
        if len(msg) > 500:
            msg = 'blip bloup'
        logger.info("%s >> %s", chan, msg)
        # Sampled bytes need not form valid UTF-8; undecodable bytes are dropped.
        self.server.privmsg(chan, msg.decode('utf-8', 'ignore'))

    def on_pubmsg(self, server, ev):
        """Feed a channel message to that channel's model and maybe reply.

        A message ending in the two characters '^I' asks the bot to complete
        it. Any other message is fed to the model as context; if it mentions
        the bot (its nick or 'frigal'), a reply addressed to the sender is
        generated with probability 0.3.
        """
        chan = ev.target.encode('utf-8')
        nick = ev.source.split('!')[0].encode('utf-8')
        msg = ev.arguments[0].encode('utf-8')

        logger.info("%s <%s> %s", chan, nick, msg)

        if chan not in self.chfuns:
            logger.warning('Recieved message on unknown channel: %s', chan)
            return

        pred_f, _ = self.chfuns[chan]
        # Lines are presented to the model as "<nick>\t<message>".
        s0 = nick + '\t' + msg
        rep = None

        if s0.endswith('^I'):
            # Completion request: continue the line and reply with everything
            # after the "<nick>\t" prefix.
            prefix = s0[:-2]
            prob, = pred_f(self.str2data(prefix))
            rep = prefix + self.pred_until(pred_f, prob)
            rep = rep.split('\t', 1)[-1]
        else:
            # feed phrase to bot
            prob, = pred_f(self.str2data(s0 + '\n'))
            if any(x in msg.lower() for x in [self.nick, 'frigal']):
                if random.uniform(0, 1) < 0.3:
                    # Sample the speaker of the next line, refusing a name
                    # that starts like the sender's; the sampled name is only
                    # logged, but sampling it advances the model state.
                    first = ord(nick[0]) if nick else None
                    fromnick = self.pred_until(pred_f, prob, '\t', forbid_first=first)
                    logger.info("from '%s'", fromnick)
                    prob, = pred_f(self.str2data(nick + ': '))
                    rep = nick + ': ' + self.pred_until(pred_f, prob)

        if rep is not None:
            self.privmsg(chan, rep)



if __name__ == "__main__":
    # The configuration module name is the last command-line argument.
    if not sys.argv[1:]:
        print >> sys.stderr, 'Usage: %s [options] config' % sys.argv[0]
        sys.exit(1)
    model_name = sys.argv[-1]

    # IRC connection settings
    chans = ['#frigotest']
    nick = 'frigo'
    port = 6667
    server = 'clipper.ens.fr'

    # Load config/<model_name>.py and build the model it describes
    config = importlib.import_module('.%s' % model_name, package='config')
    logger.info('Building model...')
    m = config.Model(config)

    # Wrap the training cost in a blocks Model and load the saved parameters
    logger.info('Building computation graph...')
    dump_path = 'params/%s-use_on_irc.pkl' % model_name
    saveload = SaveLoadParams(model=Model(m.sgd_cost), path=dump_path)
    saveload.do_load()

    # Create the bot, connect, and hand control to the IRC event loop
    irc = IRCClient(
        model=m,
        sample_temperature=config.sample_temperature,
        server=server,
        port=port,
        nick=nick,
        channels=chans,
        saveload=saveload,
    )
    irc.connect(server, port, nick)
    irc.reactor.process_forever()


#  vim: set sts=4 ts=4 sw=4 tw=0 et :