Пример #1
0
def test_getting_frequencies_per_books():
    """Check ``get_local_frequencies_per_books`` against fixed expectations.

    The expectation is two lists of ``(word, frequency)`` pairs.

    NOTE(review): the input ``words`` is defined outside this function and
    its contents are not visible here -- confirm it describes the two
    books that the expected lists correspond to.
    """
    expected_per_book = [
        [('one', 0.2), ('two', 0.3), ('three', 0.5)],
        [('one', 0.2), ('dos', 0.6), ('tres', 0.2)],
    ]

    local_frequencies = src.words.frequencies.get_local_frequencies_per_books
    actual_per_book = local_frequencies(words)

    assert are_lists_deep_equal(expected_per_book, actual_per_book)
Пример #2
0
def test_getting_relative_frequencies():
    """Exercise ``get_relative_frequencies`` in both of its call forms.

    The function is called first with ``books`` alone and then with an
    explicit ``False`` as the second positional argument; each outcome is
    compared with hard-coded lists of ``(word, value)`` pairs.

    NOTE(review): ``books`` is defined outside this function, and the
    meaning of the second argument is not visible here -- the "uniques"
    naming suggests it governs words that occur in a single book only;
    confirm against the implementation. How strictly the float values are
    compared depends on ``are_lists_deep_equal``.
    """
    relative_frequencies = src.words.frequencies.get_relative_frequencies

    # First form: only the books are passed.
    default_result = relative_frequencies(books)
    default_expected = [
        [
            ('word', 1.9499999999999997),
            ('secWord', 0.8666666666666667),
            ('thirdWord', 0.65),
        ],
        [
            ('thirdWord', 1.625),
            ('secWord', 1.4444444444444442),
            ('word', 0.5416666666666666),
        ],
    ]
    assert are_lists_deep_equal(default_expected, default_result)

    # Second form: the extra positional flag is switched to False.
    uniques_result = relative_frequencies(books, False)
    uniques_expected = [
        [
            ('seventhWord', 2.1666666666666665),
            ('word', 1.625),
            ('secWord', 0.7222222222222221),
            ('thirdWord', 0.5416666666666666),
        ],
        [
            ('milionthWord', 1.857142857142857),
            ('thirdWord', 1.3928571428571428),
            ('secWord', 1.238095238095238),
            ('word', 0.46428571428571425),
        ],
    ]
    assert are_lists_deep_equal(uniques_expected, uniques_result)
Пример #3
0
def test_filtering_out_words_in_single_book():
    """Check that words found in only one book are removed from the output.

    In the input, 'five' appears only in the first book and 'six' only in
    the second; the expected output keeps just the four words that both
    books share, with their original counts and order.
    """
    first_book = [
        ('one', 2), ('two', 3), ('three', 5), ('four', 6), ('five', 4),
    ]
    second_book = [
        ('one', 2), ('two', 6), ('three', 2), ('four', 9), ('six', 1),
    ]

    filtered = src.words.frequencies.filter_out_words_in_single_book(
        [first_book, second_book])
    # Printed so the actual value is available in the test output.
    print(filtered)

    shared_words_only = [
        [('one', 2), ('two', 3), ('three', 5), ('four', 6)],
        [('one', 2), ('two', 6), ('three', 2), ('four', 9)],
    ]
    assert are_lists_deep_equal(filtered, shared_words_only)
Пример #4
0
def test_getting_sorted_frequencies():
    """Check the ordering produced by ``get_sorted_frequencies``.

    Each expected book lists its pairs by descending value; pairs that
    share a value ('two'/'three', 'dos'/'tres') keep the relative order
    they had in the input.
    """
    unsorted_books = [
        [('one', 1), ('two', 2), ('three', 2)],
        [('dos', 2), ('one', 1), ('tres', 2)],
    ]
    sorted_books = [
        [('two', 2), ('three', 2), ('one', 1)],
        [('dos', 2), ('tres', 2), ('one', 1)],
    ]

    actual = src.words.frequencies.get_sorted_frequencies(unsorted_books)
    # Printed so the actual value is available in the test output.
    print(actual)

    assert are_lists_deep_equal(actual, sorted_books)
Пример #5
0
def test_getting_relative_frequencies_per_books():
    """Check ``get_relative_frequencies_per_books`` on a small fixed input.

    The function receives per-book ``(word, value)`` lists plus a
    word -> value mapping. In this data every expected number equals the
    per-book value divided by the mapping's value for the same word
    (e.g. 0.3 / 0.15 == 2).
    """
    per_book_values = [
        [('one', 0.2), ('two', 0.3), ('three', 0.5)],
        [('one', 0.2), ('dos', 0.6), ('tres', 0.2)],
    ]
    value_by_word = {
        'one': 0.2,
        'two': 0.15,
        'three': 0.25,
        'dos': 0.3,
        'tres': 0.1,
    }
    expected_ratios = [
        [('one', 1), ('two', 2), ('three', 2)],
        [('one', 1), ('dos', 2), ('tres', 2)],
    ]

    actual_ratios = src.words.frequencies.get_relative_frequencies_per_books(
        per_book_values, value_by_word)

    assert are_lists_deep_equal(expected_ratios, actual_ratios)
Пример #6
0
def test_are_lists_deep_equal():
    """Sanity-check the ``are_lists_deep_equal`` helper itself.

    Two distinct but identical nested lists must be reported as equal, and
    two flat lists of different length must not.
    """
    nested_left = [[12], [3]]
    nested_right = [[12], [3]]
    assert are_lists_deep_equal(nested_left, nested_right)

    longer, shorter = [1, 2, 3], [1, 2]
    assert not are_lists_deep_equal(longer, shorter)
Пример #7
0
def test_count_occurences():
    """Check ``count_occurences`` on a short list with repeated tokens.

    The input holds 'I' and 'potatoes' three times each and 'like' and
    'much' once each.

    NOTE(review): the expectation is the ``words`` object defined outside
    this function; its contents are not visible here.
    """
    tokens = ['I'] * 3 + ['like'] + ['potatoes'] * 3 + ['much']

    occurrence_counts = src.words.words_count.count_occurences(tokens)

    assert are_lists_deep_equal(occurrence_counts, words)
Пример #8
0
def test_map_to_frequencies():
    """Check ``map_to_frequencies`` against fixed ``(word, value)`` pairs.

    NOTE(review): the input ``words`` is defined outside this function.
    The expected values are multiples of 1/8 (0.375 == 3/8, 0.125 == 1/8),
    so the second argument presumably acts as the divisor / total word
    count -- confirm against the implementation.
    """
    divisor = 8
    actual = src.words.words_count.map_to_frequencies(words, divisor)

    expected_pairs = [
        ('I', 0.375),
        ('potatoes', 0.375),
        ('like', 0.125),
        ('much', 0.125),
    ]
    assert are_lists_deep_equal(actual, expected_pairs)