# basic_LM/utils.py (Dutil/basic_LM repository, master branch)
import numpy as np
import ipdb
from theano import tensor as T, config
import os, pickle, RNN

def oneHot(word, nb_class):
    """
    Build the one-hot vector of a single class index.

    :param word: index of the position to switch on
    :param nb_class: length of the returned vector
    :return: float32 vector of length ``nb_class``, all zeros except a 1 at ``word``
    """
    encoded = np.zeros(shape=nb_class, dtype=np.float32)
    encoded[word] = 1
    return encoded

def oneHots(xs, nb_class):
    """
    One-hot encode a sequence of class indices.

    Each element of ``xs`` is encoded with ``oneHot`` and the resulting
    vectors are stacked row by row.

    :param xs: iterable of class indices
    :param nb_class: number of classes (width of every row)
    :return: float32 array of shape ``(len(xs), nb_class)``; an empty ``xs``
             yields an empty ``(0, nb_class)`` array
    """
    rows = [oneHot(x, nb_class) for x in xs]
    if not rows:
        # np.array([]) would be 1-D with shape (0,); keep the result 2-D so
        # that code padding along both axes also works for an empty sequence.
        return np.zeros((0, nb_class), dtype=np.float32)
    return np.array(rows).astype(np.float32)


def t_crossEntropy(p, q):
    """
    Symbolic cross-entropy between ``p`` and ``q``.

    Computes ``-sum(p * log(q))`` with Theano tensor operations, summing over
    every element. Note that this uses ``T.log`` whereas the NumPy counterpart
    ``crossEntropy`` uses base-2 logarithms.

    :param p: target values
    :param q: predicted values, multiplied element-wise with ``p`` after the log
    :return: the negated sum as a Theano expression
    """
    weighted_log = p * T.log(q)
    return - T.sum(weighted_log)

def crossEntropy(ps, qs):
    """
    Total cross-entropy, in bits, between paired distributions.

    For every pair ``(p, q)`` taken in lockstep from ``ps`` and ``qs`` the dot
    product of ``p`` with the base-2 logarithm of ``q`` is computed; the
    function returns the negated sum of those dot products.

    :param ps: sequence of target distributions
    :param qs: sequence of predicted distributions, paired with ``ps`` by position
    :return: ``-sum_k dot(p_k, log2(q_k))``; 0 when there are no pairs
    :raises ValueError: if any value in ``qs`` is not strictly positive
    """
    # np.math was only an undocumented alias of the stdlib math module and is
    # gone from NumPy 2.0, so the stdlib module is used directly.
    import math

    total = 0
    for p, q in zip(ps, qs):
        log_q = [math.log(i, 2) for i in q]
        total += np.dot(p, log_q)
    return -1 * total


def save_everything(saving_path, rnn, metadata):
    """
    Save a model and its metadata into a directory.

    The model is written to ``<saving_path>/rnn.pkl`` through ``rnn.save`` and
    the metadata is pickled to ``<saving_path>/metadata``.

    :param saving_path: target directory; created (including missing parents)
                        when it does not exist yet
    :param rnn: object exposing a ``save(file_name)`` method
    :param metadata: any picklable object
    """
    if not os.path.exists(saving_path):
        os.makedirs(saving_path)

    # Parenthesised single-argument form prints the same text on Python 2 and 3.
    print("saving to... {}".format(saving_path))

    rnn_file_name = os.path.join(saving_path, "rnn.pkl")
    metadata_name = os.path.join(saving_path, "metadata")

    rnn.save(rnn_file_name)

    # Pickle streams are binary data: write in 'wb' mode and let the context
    # manager close (and flush) the file even if dumping fails.
    with open(metadata_name, 'wb') as metadata_file:
        pickle.dump(metadata, metadata_file)

def load_everything(loading_path):
    """
    Load a model and its metadata from a directory written by ``save_everything``.

    The model is read from ``<loading_path>/rnn.pkl`` and the metadata is
    unpickled from ``<loading_path>/metadata``.

    :param loading_path: directory containing ``rnn.pkl`` and ``metadata``
    :return: tuple ``(rnn, metadata)``
    """
    rnn_file_name = os.path.join(loading_path, "rnn.pkl")
    metadata_name = os.path.join(loading_path, "metadata")

    # WARNING: LSTM does not work (known issue). The model class is therefore
    # hard-coded to RNN.MLP instead of being chosen between RNN.LSTM and
    # RNN.RNN.
    rnn = RNN.MLP()
    rnn.load(rnn_file_name)

    # SECURITY: unpickling can execute arbitrary code; only load metadata
    # files that come from a trusted source.
    # Pickle streams are binary data: read in 'rb' mode and close the file
    # deterministically.
    with open(metadata_name, 'rb') as metadata_file:
        metadata = pickle.load(metadata_file)

    return rnn, metadata


def hotify_minibatch(minibatch, v_size, pad_before=1):
    """
    One-hot encode a minibatch of sentences and pad them to a common length.

    Every sentence is one-hot encoded, then zero-padded with ``pad_before``
    all-zero rows in front (the "empty word") and with enough all-zero rows
    behind to reach the length of the longest sentence in the minibatch.

    :param minibatch: a list of sentences, each a sequence of word indices
    :param v_size: vocabulary size, i.e. the width of each one-hot vector
    :param pad_before: number of all-zero rows inserted before each sentence
    :return: array of dtype ``config.floatX`` with axes ordered as
             (position in sentence, sentence in minibatch, vocabulary entry)
    """
    longest = max(len(tokens) for tokens in minibatch)

    padded = []
    for tokens in minibatch:
        encoded = oneHots(tokens, v_size)
        trailing = longest - len(encoded)
        # Pad only along the first (position) axis; the one-hot axis is untouched.
        pad_widths = ((pad_before, trailing), (0, 0))
        padded.append(np.pad(encoded, pad_widths, 'constant', constant_values=0))

    batch = np.array(padded).astype(config.floatX)
    # Swap the first two axes so that position comes before the sentence index.
    return batch.transpose((1, 0, 2))