• python汉字转拼音


    上代码:

    #!/usr/bin/env python
    # -*- coding:utf-8 -*-
    
    """
        Author:cleverdeng
        E-mail:clverdeng@gmail.com
    """
    
    __version__ = '0.9'
    __all__ = ["PinYin"]
    
    import os.path
    
    
    class PinYin(object):
        """Convert Chinese text to pinyin through a code-point lookup table.

        The table lives in ``self.word_dict`` and is filled by ``load_word()``.
        Keys are the upper-case hexadecimal code point of a character (the
        result of ``'%X' % ord(char)``); values are one or more
        whitespace-separated readings.
        """

        def __init__(self, dict_file='word.data'):
            """Store the dictionary path; nothing is read until ``load_word()``.

            Args:
                dict_file: Path of the lookup-table file.
            """
            self.word_dict = {}
            self.dict_file = dict_file

        def load_word(self):
            """Fill ``self.word_dict`` from ``self.dict_file``.

            Every usable line is ``<key><whitespace><readings>``. The separator
            may be any run of spaces or tabs, so the same loader copes with
            files whose column separator was changed by an editor or a
            copy/paste. Blank lines and lines without a value are skipped.

            Raises:
                IOError: If ``self.dict_file`` does not exist.
            """
            if not os.path.exists(self.dict_file):
                raise IOError("NotFoundFile")

            # open() exists on both Python 2 and 3; file() is Python 2 only.
            with open(self.dict_file) as f_obj:
                for f_line in f_obj:
                    # Split once on any whitespace: key first, readings after.
                    fields = f_line.strip().split(None, 1)
                    if len(fields) < 2:
                        continue
                    self.word_dict[fields[0]] = fields[1]

        def hanzi2pinyin(self, string=""):
            """Return one output item per character of ``string``.

            For a character found in the table, the item is its first reading
            with the final character removed and lower-cased (the final
            character is presumably a tone digit -- confirm against the data
            file). A character that is not in the table, or whose entry yields
            an empty result, is passed through unchanged.

            Args:
                string: Text to convert. Byte strings are decoded as UTF-8.

            Returns:
                A list of strings, one per input character.
            """
            # On Python 2 ``bytes`` is ``str``, so this decodes exactly the
            # inputs the old ``not isinstance(string, unicode)`` test decoded.
            if isinstance(string, bytes):
                string = string.decode("utf-8")

            result = []
            for char in string:
                entry = self.word_dict.get('%X' % ord(char))
                readings = entry.split() if entry else []
                pinyin = readings[0][:-1].lower() if readings else ""
                # Fall back to the character itself rather than emitting ''.
                result.append(pinyin or char)

            return result

        def hanzi2pinyin_split(self, string="", split=""):
            """Convert ``string`` and optionally join the pieces.

            Args:
                string: Text to convert (see ``hanzi2pinyin``).
                split: Separator placed between the converted items.

            Returns:
                The list from ``hanzi2pinyin`` when ``split`` is the empty
                string, otherwise a single string joined with ``split``.
            """
            result = self.hanzi2pinyin(string=string)
            if split == "":
                return result
            return split.join(result)
    
    if __name__ == "__main__":
        # Demo: load the default dictionary file and convert a sample word,
        # first as a list of syllables and then joined with "-".
        test = PinYin()
        test.load_word()
        string = "巴林"
        # Single-argument print(...) gives the same output on Python 2 and 3,
        # whereas the print statement is a SyntaxError on Python 3.
        print("in: %s" % string)
        print("out: %s" % str(test.hanzi2pinyin(string=string)))
        print("out: %s" % test.hanzi2pinyin_split(string=string, split="-"))

    用到了字典文件 word.data(代码默认按相对路径 'word.data' 打开,需放在运行脚本时的当前目录下)。

  • 相关阅读:
    线程的start和run方法的区别
    GC相关的面试题
    AVR单片机教程——EasyElectronics Library v1.3手册
    我回来了
    继续停更通知
    停更通知
    玩玩24点(上)
    AVR单片机教程——EasyElectronics Library v1.2手册
    AVR单片机教程——数码管
    算法基础课程总结
  • 原文地址:https://www.cnblogs.com/Micang/p/8662803.html
Copyright © 2020-2023  润新知