def test__clean_sentence_mention_only_whitespace():
    """Check that a link whose mention text is only whitespace is removed.

    The input carries a single link whose "text" is a lone space; the
    expected output has an empty "links" list and the sentence text
    unchanged.
    """
    text = (
        "Die Parade tussen Plein-, Buitenkant-, Darling- en Kasteelstraat "
        "in Kaapstad word as markplein, parkeerterrein en vir "
        "massabyeenkomste gebruik."
    )
    raw = {
        "text": text,
        # The mention text is a single space, i.e. whitespace only.
        "links": [{"page": " Kaapstad", "text": " "}],
    }
    expected = {"text": text, "links": []}

    assert dc._clean_sentence(raw) == expected
def test__clean_sentence_implicit_link():
    """Check that a link with only a "page" key comes back unchanged.

    The link has no "text" entry; the expected output is equal to the
    input sentence.
    """
    raw = {"text": "some text", "links": [{"page": "some"}]}
    # Built as a separate literal (not an alias of ``raw``) so an in-place
    # mutation by the function under test cannot make the comparison pass
    # trivially.
    expected = {"text": "some text", "links": [{"page": "some"}]}

    assert dc._clean_sentence(raw) == expected