找出文件中的中文

来源:互联网 发布:淘宝分享购物清单在哪 编辑:程序博客网 时间:2024/05/20 22:28
"""Check whether a file contains Chinese characters and report where they are.

Usage: pass exactly one file path on the command line.  Every line that
contains Chinese characters is printed and also written to ``result.txt``
in the current working directory.
"""
import re
import sys

# Matches one character in the range U+4E00..U+9FA5 (CJK ideographs).
m = re.compile(u'[\u4e00-\u9fa5]')


def readfile(filename):
    """Return the content of *filename* as a list of lines.

    UTF-8 is tried first because its decoding is strict: bytes that are not
    UTF-8 are rejected instead of being silently turned into wrong
    characters.  If that fails, the platform's default encoding is used.

    Raises:
        UnicodeDecodeError: if the file decodes with neither encoding.
        OSError: if the file cannot be opened.
    """
    try:
        with open(filename, 'r', encoding='utf-8') as f:
            return f.readlines()
    except UnicodeDecodeError:
        with open(filename, 'r') as f:
            return f.readlines()


def exp(linedata):
    """Return all Chinese characters of *linedata* joined into one string.

    Returns None when the line contains no Chinese character.
    """
    cn = m.findall(linedata)
    return ''.join(cn) if cn else None


def findchinese(filename):
    """Report every line of *filename* that contains Chinese characters.

    One entry per matching line is produced, holding the 1-based line number
    and the Chinese characters found on that line.  The report is printed to
    stdout and written to ``result.txt`` (overwriting any existing file).
    """
    entries = []
    # Start at 1 so the reported numbers agree with what editors display.
    for lineno, text in enumerate(readfile(filename), start=1):
        found = exp(text)
        if found:
            entries.append(f'line num :{lineno}  ; data = {found}\n')
    total_str = ''.join(entries)
    print(total_str)
    # Explicit UTF-8: the default encoding of some platforms cannot
    # represent Chinese characters and would raise UnicodeEncodeError.
    with open('result.txt', 'w', encoding='utf-8') as f:
        f.write(total_str)


if __name__ == '__main__':
    if len(sys.argv) == 2:
        findchinese(sys.argv[1])
    else:
        print('参数错误')
原创粉丝点击