为何open打开.py文件后不可阅读

过54321 · 发表于 2019-5-29 23:24:53

马上注册，结交更多好友，享用更多功能^_^

您需要登录才可以下载或查看，没有账号？立即注册

x

目的是统计一个文件夹各个文件的数目和.py文件中的总行数，可是有如下错误，一直不能更改，问是何原因
import os
import easygui as g
import os.path

def searchfor():
count_py=0
f_py=0
count_txt=0
f_txt=0
count_docx=0
f_docx=0
os.chdir(g.diropenbox())
files=os.walk(os.getcwd())
for file_aggregate in files:
      for i in file_aggregate[2]:

         (f_start,f_end)=os.path.splitext(i)
         if f_end=='.py':
            f_py+=1
            file_name=file_aggregate[0]+'\\'+i
            print(file_name)

            f=open(file_name)

            for j in list(f):
                  count_py+=1
            f.close()
         elif f_end=='.txt':
            f_txt+=1
            file_name=file_aggregate[0]+'\\'+i
            f=open(file_name,)
            for j in list(f):
                  count_txt+=1
            f.close()
         elif f_end=='.docx':
            f_docx+=1
            file_name=file_aggregate[0]+'\\'+i
            f=open(file_name+'\\'+i)
            for j in list(f):
                  count_docx+=1
            f.close()
count_py1=count_py/100
rest=10000-count_py
msg='您目前共累计编写了%d行代码,完成进度:%d\n离10万行代码还差%d行,请继续努力!' % (count_py,count_py1,rest)
tile='代码总计'
word='【.py】源文件%d个，源代码%d行\n【.txt】源文件%d个，源代码%d行\n【.docx】源文件%d个，源代码%d行' % (f_py,count_py,f_txt,count_txt,f_docx,count_docx)
g.textbox(msg,tile,word)

searchfor()

°蓝鲤歌蓝 · 发表于 2019-5-29 23:37:14

编码错误

ba21 · 发表于 2019-5-29 23:47:46

cchardet 比chardet准确度高，速度快
cchardet.detect()返回字典，其中confidence是检测精确度，encoding是编码形式
1：网页编码判断：
import requests
import cchardet
res = requests.get('http://www.baidu.com/')
rawdata = res.content
cchardet.detect(rawdata)
>>>{'confidence': 0.98999999999999999, 'encoding': 'GB2312'}
2：文件编码判断
import cchardet
with open('c:\\111.txt','rb') as f:
msg=f.read()
enc = cchardet.detect(msg)
enc = enc['encoding']
print(enc)
# 以指定编码打开文件
with open("新建文本文档.txt", "r", encoding=enc) as f:
print(f.read())

复制代码

-------------------------------------------------------------------------------------------------------------------------------------------

import easygui as g
import os, cchardet
def get_file_code(path):
with open(path,'rb') as f:
msg=f.read()
enc = cchardet.detect(msg)
enc = enc['encoding']
return enc
def show_result(start_dir):
lines = 0
total = 0
text = ""
for i in source_list:
lines = source_list[i]
total += lines
text += "【%s】源文件 %d 个，源代码 %d 行\n" % (i, file_list[i], lines)
title = '统计结果'
msg = '您目前共累积编写了 %d 行代码，完成进度：%.2f %%\n离 10 万行代码还差 %d 行，请继续努力！' % (total, total/1000, 100000-total)
g.textbox(msg, title, text)
def calc_code(file_name):
lines = 0
enc = get_file_code(file_name) # 获取文件编码
with open(file_name, "r", encoding=enc) as f: # 以指定编码打开文件
print('正在分析文件：%s ...' % file_name)
try:
for each_line in f:
lines += 1
except UnicodeDecodeError:
pass # 不可避免会遇到格式不兼容的文件，这里忽略掉......
return lines
def search_file(start_dir) :
#首先通过异常判断该文件夹是否有访问权限，这里用 os.listdir列目录尝试。
try:
os.listdir(start_dir)
except:
return
os.chdir(start_dir)
for each_file in os.listdir(os.curdir) :
ext = os.path.splitext(each_file)[1]
if ext in target :
lines = calc_code(each_file) # 统计行数
# 还记得异常的用法吗？如果字典中不存，抛出 KeyError，则添加字典键
# 统计文件数
try:
file_list[ext] += 1
except KeyError:
file_list[ext] = 1
# 统计源代码行数
try:
source_list[ext] += lines
except KeyError:
source_list[ext] = lines
if os.path.isdir(each_file):
search_file(each_file) # 递归调用
os.chdir(os.pardir) # 递归调用后切记返回上一层目录
target = ['.c', '.cpp', '.py', '.cc', '.java', '.pas', '.asm']
file_list = {}
source_list = {}
g.msgbox("请打开您存放所有代码的文件夹......", "统计代码量")
path = g.diropenbox("请选择您的代码库：")
search_file(path)
show_result(path)

复制代码

yh6788 · 发表于 2019-5-30 01:13:46

中文编码的问题吧，
f=open(file_name)
这里如果改成with open(file_name,"r",encoding="utf8") as f:
你试下OK不，

过54321 · 发表于 2019-5-30 09:58:54

yh6788 发表于 2019-5-30 01:13
中文编码的问题吧，
f=open(file_name)
这里如果改成with open(file_name,"r",encoding="utf8") as f:

感谢

账号		自动登录	找回密码
密码			立即注册

为何open打开.py文件后不可阅读

马上注册，结交更多好友，享用更多功能^_^

回帖奖励 +1 鱼币

回帖奖励 +1 鱼币

浏览过的版块