# Source code for topik.vectorizers.tests.test_bag_of_words

from topik.vectorizers.bag_of_words import bag_of_words

# Two small tokenized documents given as (document id, token list) pairs.
# "frank" occurs three times in doc1 and once in doc2; "dog" is shared by
# both documents, while "cat" and "llama" each appear in only one.
sample_data = [
    ("doc1", ["frank", "frank", "frank", "dog", "cat"]),
    ("doc2", ["frank", "dog", "llama"]),
]

# Vectorized once at import time; test_vectorizer reads this shared result.
output = bag_of_words(sample_data)



def test_vectorizer():
    """Check the per-document vectors produced by ``bag_of_words``.

    Reads the module-level ``output`` (the result of calling
    ``bag_of_words`` on ``sample_data``) and compares the entry of
    ``output.vectors`` for each document id against an expected mapping.
    The integer keys are presumably term ids assigned by the vectorizer
    and the values the number of occurrences in that document -- the
    values match the token counts in ``sample_data``, but the id
    assignment itself is not visible from this module.
    """
    # doc1: one token three times ("frank") plus two tokens once each.
    assert output.vectors["doc1"] == {1: 3, 2: 1, 3: 1}
    # doc2: three distinct tokens, each occurring once.
    assert output.vectors["doc2"] == {0: 1, 1: 1, 2: 1}