hi,

In the context of the discussion on counting Tamil characters, here is one
solution:

#!/usr/bin/env python
# -*- coding: utf-8 -*-

import codecs

def countsyll(instring):
    """Count the code points of ``instring`` that are not Tamil dependent signs.

    Tamil vowel signs, the AU length mark and the pulli (virama) attach to
    the letter before them, so they are skipped.  Every other code point
    counts as one -- this includes spaces, punctuation and non-Tamil
    characters, which are not filtered out.

    :param instring: text to measure, as a unicode string.
    :returns: number of code points that are not in the dependent-sign set.
    """
    # Round-trip through the UTF-8 codec so that input the codec cannot
    # encode still fails here instead of being counted.
    text = codecs.utf_8_decode(codecs.utf_8_encode(instring)[0])[0]

    # U+0BBE..U+0BCC are the vowel signs, U+0BCD is the pulli.  U+0BD7 is the
    # AU length mark: U+0BCC canonically decomposes to U+0BC6 + U+0BD7, so
    # without it decomposed (NFD) text is overcounted by one per "au" sign.
    dependent_signs = frozenset([
        u'\u0bbe', u'\u0bbf', u'\u0bc0',
        u'\u0bc1', u'\u0bc2', u'\u0bc6',
        u'\u0bc7', u'\u0bc8', u'\u0bca',
        u'\u0bcb', u'\u0bcc', u'\u0bcd',
        u'\u0bd7',
    ])
    return sum(1 for ch in text if ch not in dependent_signs)

if __name__ == '__main__':
    # Demo run on a sample Tamil phrase.  The parenthesised single-argument
    # form prints the same on Python 2 and is valid syntax on Python 3.
    print(countsyll(u'ஆண்டவரின் துணைவன்'))

-- 
regards
KG
http://lawgon.livejournal.com

_______________________________________________
ILUGC Mailing List:
http://www.ae.iitm.ac.in/mailman/listinfo/ilugc

Reply via email to