summaryrefslogtreecommitdiff
path: root/klm/lm/interpolate/arpa_to_stream.hh
blob: 4613998d41a80fb77e9d8aa13b228d89dbfe3a21 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
#include "lm/read_arpa.hh"
#include "util/file_piece.hh"

#include <vector>

#include <stdint.h>

namespace util { namespace stream { class ChainPositions; } }

namespace lm {

namespace ngram {
template <class T> class GrowableVocab;
class WriteUniqueWords;
} // namespace ngram

namespace interpolate {

class ARPAToStream {
  public:
    // Takes ownership of fd.
    explicit ARPAToStream(int fd, ngram::GrowableVocab<ngram::WriteUniqueWords> &vocab);

    std::size_t Order() const { return counts_.size(); }

    const std::vector<uint64_t> &Counts() const { return counts_; }

    void Run(const util::stream::ChainPositions &positions);

  private:
    util::FilePiece in_;

    std::vector<uint64_t> counts_;

    ngram::GrowableVocab<ngram::WriteUniqueWords> &vocab_;
};

}} // namespaces