summaryrefslogtreecommitdiff
path: root/python/src/sa/features.pxi
blob: fcb93f2697ae3f5ad83aa5104ad2757bac579284 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
# Module-level string map shared by the classes below: FD.index() turns a
# feature name into an integer id and FD.word() maps an id back to its name.
cdef StringMap FD = StringMap()

INITIAL_CAPACITY = 7 # default number of features
# Passed as the second constructor argument of the IntList/FloatList buffers
# in FeatureVector. NOTE(review): presumably the growth step, so the first
# resize doubles the capacity -- confirm against IntList/FloatList.
INCREMENT = INITIAL_CAPACITY # double size

cdef class FeatureVector:
    """Feature vector stored as two parallel lists: integer feature ids
    (``names``) and their float values (``values``)."""

    def __cinit__(self):
        # Both buffers get the same initial capacity and increment arguments.
        self.names = IntList(INITIAL_CAPACITY, INCREMENT)
        self.values = FloatList(INITIAL_CAPACITY, INCREMENT)

    def set(self, unsigned name, float value):
        """Append the pair (feature id, value).

        The pair is always appended; an existing entry with the same id is
        neither looked up nor replaced.
        """
        self.names.append(name)
        self.values.append(value)

    def __iter__(self):
        """Yield ``(feature name, value)`` tuples in index order, mapping
        each stored id back to its name through ``FD.word``."""
        cdef unsigned pos = 0
        # The length is read once, before the first pair is produced.
        cdef unsigned count = self.names.len
        while pos < count:
            yield (FD.word(self.names[pos]), self.values[pos])
            pos += 1

    def __str__(self):
        """Return the features as space-separated ``name=value`` items."""
        rendered = ['%s=%s' % (label, weight) for label, weight in self]
        return ' '.join(rendered)

cdef class Scorer:
    """Apply a fixed set of feature functions ("models") to a phrase pair.

    Each model is a callable invoked as
    ``model(fphrase, ephrase, paircount, fcount, fsample_count)``; its
    ``__name__`` is registered in ``FD`` and used as the feature name.
    """
    cdef models
    def __init__(self, *models):
        """Register every model's ``__name__`` in ``FD`` and keep the
        resulting ``(feature id, model)`` pairs for ``score``."""
        # NOTE(review): the <char *> cast needs a byte-string-compatible
        # __name__; confirm the string coercion settings if building for
        # Python 3.
        names = [FD.index(<char *>model.__name__) for model in models]
        # Materialize the pairs. On Python 3, zip() returns a one-shot
        # iterator that the first score() call would exhaust, so every later
        # call would silently produce an empty FeatureVector.
        self.models = list(zip(names, models))

    cdef FeatureVector score(self, Phrase fphrase, Phrase ephrase,
            unsigned paircount, unsigned fcount, unsigned fsample_count):
        """Return a FeatureVector holding one value per registered model,
        in registration order, each computed by calling the model with the
        given phrases and counts."""
        cdef FeatureVector scores = FeatureVector()
        for name, model in self.models:
            scores.set(name, model(fphrase, ephrase, paircount, fcount, fsample_count))
        return scores