|
|
马上注册,结交更多好友,享用更多功能^_^
您需要 登录 才可以下载或查看,没有账号?立即注册
x
import jieba
import xlrd
class Cut:
def read_excel(self):
file_path = r'D:\pycharm professional\workspace\爬虫\crawler\crawler\python职位.xls'
# 读取的文件路径
# file_path = file_path.decode('utf-8')
# 文件中的中文转码
self.data = xlrd.open_workbook(file_path)
# 获取数据
self.table = self.data.sheet_by_name('python职位')
# 获取sheet
self.nrows = self.table.nrows
# 获取总行数
for each_row in range(self.nrows):
self.cell_value = self.table.cell(each_row,4).value
return self.cell_value
def seg_sentence(self,sentence):
self.seg_sentence = jieba.cut(sentence,cut_all=False,HMM=True)
return self.seg_sentence
if __name__ == "__main__":
cut = Cut()
str = cut.read_excel()
sets = cut.seg_sentence(str)
print(",".join(sets))
大佬们,这个for循环哪里出了问题,为什么没有循环 |
|