Ejemplo n.º 1
0
 def test_alltamil(self):
     """utf8.all_tamil is true for a Tamil-only string, false once Latin text is mixed in."""
     pure_tamil = u"அஆஇஈஉ"
     mixed_script = u"அஆஇNotTamilஈஉ"
     self.assertTrue(utf8.all_tamil(pure_tamil))
     self.assertFalse(utf8.all_tamil(mixed_script))
Ejemplo n.º 2
0
        print('completed')
        break
    #print(href)
    # Dump the raw text of the current item to the second output file.
    fil2.write(job_elems.text)

    # Candidate words: the words found in this text plus whatever `final`
    # already holds (presumably the top-ten list computed on a previous pass
    # of the enclosing loop -- confirm against the code above this fragment).
    result = utf8.get_words(job_elems.text)
    result.extend(final)

    # Curly quotes and sentence punctuation are deleted in one pass; the
    # table maps each of these characters to "removed".
    punctuation = str.maketrans('', '', '”“!.,?')
    for word in result:
        # Punctuation is stripped first, then every occurrence of this one
        # specific Tamil word is removed from what remains.
        word = word.translate(punctuation).replace('ஏற்றப்படுகின்றது', '')
        # Keep a word only if it is entirely Tamil and has not been recorded
        # yet; each kept word is written to `fil` on its own line.
        if utf8.all_tamil(word) and word not in new:
            new.append(word)
            fil.write(word + '\n')

    # Ten entries of `new` with the highest len(utf8.get_letters(w)).
    # The running counter makes every sort key unique, so with reverse=True
    # words with equal letter counts come out latest-added first
    # (assuming `count` is itertools.count -- it is imported outside this view).
    cnt = count()
    final = sorted(new,
                   key=lambda w: (len(utf8.get_letters(w)), next(cnt)),
                   reverse=True)[:10]
    print(final)
Ejemplo n.º 3
0
 def test_alltamil(self):
     """Exercise utf8.all_tamil with one Tamil-only input and one containing Latin letters."""
     # Only Tamil letters: expected to be reported as all-Tamil.
     verdict = utf8.all_tamil(u"அஆஇஈஉ")
     self.assertTrue(verdict)
     # Same letters with "NotTamil" embedded: expected to be rejected.
     verdict = utf8.all_tamil(u"அஆஇNotTamilஈஉ")
     self.assertFalse(verdict)