blob: 921a2b22cfcc9c174daee807948984230cbdd4b6 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
|
#ifndef LM_NEURAL_WORDVECS_H
#define LM_NEURAL_WORDVECS_H
#include "util/scoped.hh"
#include "lm/vocab.hh"
#include <Eigen/Dense>
namespace util { class FilePiece; }
namespace lm {
namespace neural {
class WordVecs {
  public:
    // Dense float matrix in column-major layout. Each column is one word
    // vector, and the column index is the word.
    typedef Eigen::Matrix<float, Eigen::Dynamic, Eigen::Dynamic, Eigen::ColMajor> Storage;

    // Build from a text file. Expected layout: the first line states the
    // number of word vectors and the length of the vectors; it is followed by
    // lines each containing a word and then floating-point values.
    explicit WordVecs(util::FilePiece &in);

    // Look up the index of a word by delegating to the vocabulary.
    WordIndex Index(StringPiece str) const {
      return vocab_.Index(str);
    }

    // Read-only view of the whole word-vector matrix.
    const Storage &Vectors() const {
      return vecs_;
    }

  private:
    // Keep this declaration order: C++ initializes members in the order they
    // are declared here.
    // NOTE(review): vocab_backing_ presumably owns the memory vocab_ is built
    // on -- confirm against the constructor in the .cc file.
    util::scoped_malloc vocab_backing_;
    ngram::ProbingVocabulary vocab_;
    Storage vecs_;
};
}} // namespaces
#endif // LM_NEURAL_WORDVECS_H
|