Пример #1
0
        /// <summary>
        /// Builds the featurizer from a Txt2Vec binary model: loads the model,
        /// then stores one normalized <c>SingleVector</c> per term in
        /// <c>m_WordEmbedding</c>. Also allocates <c>m_UnkEmbedding</c>, a
        /// vector of the model's dimension.
        /// </summary>
        /// <param name="filename">
        /// Model file passed to <c>Txt2Vec.Decoder.LoadBinaryModel</c>.
        /// </param>
        /// <exception cref="System.ArgumentNullException">
        /// <paramref name="filename"/> is <c>null</c>.
        /// </exception>
        public WordEMWrapFeaturizer(string filename)
        {
            // Fail fast with a clear message instead of an opaque failure inside the decoder.
            if (filename == null)
            {
                throw new System.ArgumentNullException("filename");
            }

            Txt2Vec.Decoder decoder = new Txt2Vec.Decoder();
            decoder.LoadBinaryModel(filename);

            string[] terms = decoder.GetAllTerms();
            vectorSize = decoder.GetVectorSize();

            // The number of entries is known up front, so presize the table to
            // avoid repeated rehashing while the vocabulary is loaded.
            m_WordEmbedding = new Dictionary<string, SingleVector>(terms.Length);

            // Embedding kept for unknown terms; built from the dimension only.
            // NOTE(review): presumably zero-initialized by SingleVector - confirm.
            m_UnkEmbedding = new SingleVector(vectorSize);

            foreach (string term in terms)
            {
                double[] vector = decoder.GetVector(term);

                // Terms for which the decoder returns no vector are skipped.
                if (vector == null)
                {
                    continue;
                }

                SingleVector spVector = new SingleVector(vectorSize, vector);
                spVector.Normalize();

                // Add throws on a duplicate key; terms are presumably unique
                // within one model - verify against Txt2Vec.Decoder.GetAllTerms.
                m_WordEmbedding.Add(term, spVector);
            }
        }