|  | 
 
| 
处理txt文档的数据时候出现解码问题
x
马上注册,结交更多好友,享用更多功能^_^您需要 登录 才可以下载或查看,没有账号?立即注册  
 复制代码import sys
import re
args=sys.argv
sum_list=[]
alist=[]
unmatch_list=[]
with open(args[1],"r",encoding="utf-8") as f:
    for line in f:
        line=line.strip("\n").split("\t")
        symbol=line[1]
        alist.append(symbol)
        if line[8]:
            alias_symbol=line[8].split("|")
            for i in alias_symbol:
                alist.append(i)
        if line[10]:
            prev_symbol=line[10].split("|")
            for i in prev_symbol:
                alist.append(i)
    sum_list.append(alist)
    alist.clear()
 Traceback (most recent call last):
 File "C:/Users/likuokuo/PycharmProjects/python/p_value.py", line 10, in <module>
 for line in f:
 File "C:\Users\likuokuo\AppData\Local\Programs\Python\Python35\lib\codecs.py", line 321, in decode
 (result, consumed) = self._buffer_decode(data, self.errors, final)
 UnicodeDecodeError: 'utf-8' codec can't decode bytes in position 6015-6016: invalid continuation byte
 | 
 |