Fix datatype parameter for KeyedVectors.load_word2vec_format. Fix #1682 #1819

Merged Feb 16, 2018 (19 commits)
Changes from 8 commits
6 changes: 3 additions & 3 deletions gensim/models/keyedvectors.py
@@ -220,7 +220,7 @@ def add_word(word, weights):
                result.index2word.append(word)

            if binary:
-                binary_len = dtype(REAL).itemsize * vector_size
+                binary_len = dtype(datatype).itemsize * vector_size
Contributor Author:
I am having a problem detecting binary_len for vectors saved with a custom datatype. The only clue is that the next vector starts after a " ", but before that space comes a string (also converted to Python bytes) which can be of any length. @menshikh-iv any suggestion?
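For anyone following along, a minimal sketch of the layout in question (a hypothetical two-word file, not the gensim implementation itself):

import numpy as np

vector_size = 2
records = b''
for word, vec in [(b'kangaroo.n.01', [0.1, 0.2]), (b'horse.n.01', [0.3, 0.4])]:
    # word bytes + b' ' + raw vector bytes; nothing marks where the vector ends
    records += word + b' ' + np.array(vec, dtype=np.float16).tobytes()

# The reader must know binary_len up front: the vector bytes may themselves
# contain b' ' or b'\n', so scanning for a delimiter is unreliable.
binary_len = np.dtype(np.float16).itemsize * vector_size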

Contributor Author (@pushpankar), Jan 18, 2018:
I tried adding \n at the end of each vector when saving in binary, but that broke many other tests.

Contributor:
@pushpankar how does it work if datatype=REAL here?

Contributor Author (@pushpankar), Jan 19, 2018:
Since floats were previously saved only with 32-bit precision, knowing the size of each vector in the binary format was easy; casting to lower precision was only done after loading the vectors. Please also note that in the develop branch too, casting a vector to lower precision, saving it in binary and then loading it leads to errors, because float32 is assumed while loading even though the data was saved with a lower precision like float16. I am adding some code to make this clearer.

import numpy as np
from gensim.models.keyedvectors import KeyedVectors

model = KeyedVectors.load_word2vec_format('./test_data/test.kv.txt', datatype=np.float16)
print(model['horse.n.01'][0])
model.save_word2vec_format('./test_data/test.kv.bin', binary=True)
model2 = KeyedVectors.load_word2vec_format('./test_data/test.kv.bin', datatype=np.float32, binary=True)
print(model2['horse.n.01'][0])

Gives

Traceback (most recent call last):
  File "convert2binary.py", line 7, in <module>
    print(model2['horse.n.01'][0])
  File "/home/pushpankar/gensim/gensim/models/keyedvectors.py", line 326, in __getitem__
    return self.word_vec(words)
  File "/home/pushpankar/gensim/gensim/models/keyedvectors.py", line 453, in word_vec
    raise KeyError("word '%s' not in vocabulary" % word)
KeyError: "word 'horse.n.01' not in vocabulary"

This is because float32 was assumed while reading the binary vectors, but they were originally saved as float16, so more bytes than necessary were read for every vector and every word boundary after the first was corrupted.
Let me know if I am not clear enough.
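Concretely, for this 2-dimensional test file the mismatch works out as follows (a sketch with the sizes spelled out):

import numpy as np

vector_size = 2
stored = np.dtype(np.float16).itemsize * vector_size   # 4 bytes per vector on disk
assumed = np.dtype(np.float32).itemsize * vector_size  # 8 bytes read by the loader
# Each read overshoots by 4 bytes and swallows the start of the next word,
# so 'horse.n.01' never enters the vocabulary intact.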

Contributor:
So probably the easiest solution for this case is to read/write with the REAL type & cast it before the end of the "load" process, wdyt @jayantj?
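A rough sketch of that suggestion (assuming REAL is np.float32, as in gensim, with np.frombuffer standing in for the deprecated fromstring): the file is always read as float32, and the cast to the requested datatype happens once at the end.

import numpy as np

REAL = np.float32

def read_vector(fin, vector_size, datatype=REAL):
    # The file is always written as float32, so binary_len stays unambiguous.
    binary_len = np.dtype(REAL).itemsize * vector_size
    weights = np.frombuffer(fin.read(binary_len), dtype=REAL)
    # Cast to the requested precision only at the end of loading.
    return weights.astype(datatype)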

                for _ in xrange(vocab_size):
                    # mixed text and binary: read text first, then binary
                    word = []
@@ -233,7 +233,7 @@ def add_word(word, weights):
                        if ch != b'\n':  # ignore newlines in front of words (some binary files have)
                            word.append(ch)
                    word = utils.to_unicode(b''.join(word), encoding=encoding, errors=unicode_errors)
-                    weights = fromstring(fin.read(binary_len), dtype=REAL)
+                    weights = fromstring(fin.read(binary_len), dtype=datatype)
                    add_word(word, weights)
            else:
                for line_no in xrange(vocab_size):
@@ -243,7 +243,7 @@ def add_word(word, weights):
                    parts = utils.to_unicode(line.rstrip(), encoding=encoding, errors=unicode_errors).split(" ")
                    if len(parts) != vector_size + 1:
                        raise ValueError("invalid vector on line %s (is this really the text format?)" % line_no)
-                    word, weights = parts[0], [REAL(x) for x in parts[1:]]
+                    word, weights = parts[0], np.array(parts[1:], dtype=datatype)
                    add_word(word, weights)
        if result.syn0.shape[0] != len(result.vocab):
            logger.info(
2 changes: 2 additions & 0 deletions gensim/test/test_data/test.kv.bin
@@ -0,0 +1,2 @@
2 2
kangaroo.n.01 8��&�%H��.���horse.n.01 \O�($L���k�P6I?
3 changes: 3 additions & 0 deletions gensim/test/test_data/test.kv.txt
@@ -0,0 +1,3 @@
2 2
kangaroo.n.01 -0.0007369244245224787 -8.269973595356034e-05
horse.n.01 -0.0008546282343595379 0.0007694142576316829
37 changes: 37 additions & 0 deletions gensim/test/test_datatype.py
@@ -0,0 +1,37 @@
#!/usr/bin/env python
# -*- coding: utf-8 -*-
#
# Licensed under the GNU LGPL v2.1 - http://www.gnu.org/licenses/lgpl.html

"""
Automated tests for checking the datatype parameter of KeyedVectors.load_word2vec_format.
"""

import logging
Contributor:
Please add a file header, like in the other test files.

import unittest

import numpy as np

from gensim.test.utils import datapath
from gensim.models.keyedvectors import KeyedVectors


class TestDataType(unittest.TestCase):
    def test_binary(self):
        path = datapath('test.kv.bin')
        kv = KeyedVectors.load_word2vec_format(path, binary=True,
                                               datatype=np.float64)
        self.assertAlmostEqual(kv['horse.n.01'][0], -0.0008546282343595379)
        self.assertEqual(kv['horse.n.01'][0].dtype, np.float64)

    def test_text(self):
        path = datapath('test.kv.txt')
        kv = KeyedVectors.load_word2vec_format(path, binary=False,
                                               datatype=np.float64)
Contributor:
What about different datatypes?

Contributor Author:
Will np.float16, np.float32, and np.float64 be enough?

Contributor:
Yes
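A possible way to cover all three at once (a hypothetical addition to this test class, not part of the PR as written; float16 needs a looser tolerance since it carries only about three significant digits):

    def test_dtypes(self):
        path = datapath('test.kv.txt')
        for dt in (np.float16, np.float32, np.float64):
            kv = KeyedVectors.load_word2vec_format(path, binary=False, datatype=dt)
            # float16 rounds the stored value, hence the loose delta
            self.assertAlmostEqual(kv['horse.n.01'][0], -0.0008546282343595379, delta=1e-5)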

        self.assertAlmostEqual(kv['horse.n.01'][0], -0.0008546282343595379)
        self.assertEqual(kv['horse.n.01'][0].dtype, np.float64)

Contributor:
Another test to verify that the type of a value in the loaded array matches the datatype passed to load_word2vec_format would explicitly confirm the new behaviour.
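Such a check might look like this (a sketch of the reviewer's suggestion, reusing the test data above; the method name is made up):

    def test_dtype_matches_parameter(self):
        path = datapath('test.kv.txt')
        kv = KeyedVectors.load_word2vec_format(path, binary=False, datatype=np.float16)
        # The whole loaded matrix, not just one value, should carry the requested type.
        self.assertEqual(kv.syn0.dtype, np.float16)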


if __name__ == '__main__':
    logging.root.setLevel(logging.WARNING)
    unittest.main()