根据excel列数据提取模版，生成新的excel，有图片和格式的

颂风侯 · 发表于 2024-7-26 14:13:48

马上注册，结交更多好友，享用更多功能^_^

您需要登录才可以下载或查看，没有账号？立即注册

x

目前已经提取了一个pandas的dataframe文件。
df_merge.to_excel("提取数据.xlsx", index=False)
同时生成到了excel，如下

管线号                                                             焊接类型        工艺卡编号        焊接材质        外径壁厚        管线寸口        道数        焊接寸口
/TRIM-排污-取样器水槽-N1-40-A1TB52-N             对焊                HKB20-02        20-GB/T8163        Φ48.3*5.08        1.5        1        1.5
/TRIM-排污-取样器水槽-N1-40-A1TB52-N            承插焊                HKC20-02        20-GB/T8163&20-NB/T47008        Φ*5.08        1.5        2        3
/TRIM-排污-取样器水槽-N1-40-A1TB52-N            承插焊                HKC20-02        20-GB/T8163&20-NB/T47008        Φ48.3*5.08        1.5        2        3
/TRIM-排污-取样器水槽-N1-40-A1TB52-N            承插焊                 HKC20-02        20-GB/T8163&A105        Φ*5.08        1.5        1        1.5
/TRIM-排污-取样器水槽-N1-40-A1TB52-N            承插焊                 HKC20-02        20-GB/T8163&A105        Φ48.3*5.08        1.5        1        1.5
/TRIM-排污-安全阀及消声器排水-20-A1TB51-N        承插焊        HKC20-02        20-GB/T8163        Φ21.3*3.73        1        7        7
/TRIM-排污-安全阀及消声器排水-20-A1TB51-N        对焊                HKB20-02        20-GB/T8163        Φ26.7*3.91        1        3        3

现在需要根据“管线号”列的数据，新建名称为“管线号”列数据的excel，并去同一级的另一个名称为“模版的文件夹里，找到”对应“工艺卡编号”列的名称的对应模版的excel，插入第一个sheet
sheet名称用“工艺卡编号“的名称

就是生成名称为“/TRIM-排污-取样器水槽-N1-40-A1TB52-N”.xlsx的excel，里面有模版sheet，名称为“HKB20-02”，“HKC20-02        ”，是复制“模版的文件夹里的对应模版的第一个sheet

提取模版能提取，但是模版里面有图，有格式，提取后图没了，excel表格式也没有全乱的，这个有没有其他办法

颂风侯 · 发表于 2024-7-26 14:29:48

import pandas as pd
import os
from openpyxl import load_workbook, Workbook
# 假设你的 DataFrame 已经创建为 df_merge
df_merge = pd.read_excel("提取数据2.xlsx")
# 模板文件夹路径
template_folder = "D:/PYTHON_NEW/pythonProject/提取python excel/工艺卡模版"
# 定义输出路径
output_folder = "C:\\集中"
# 确保输出文件夹存在
os.makedirs(output_folder, exist_ok=True)
# 遍历每一行
for index, row in df_merge.iterrows():
pipe_number = row['管线号'] # 假设管线号在 DataFrame 中的列名是 '管线号'
# 创建新的 Excel 文件
new_file_path = os.path.join(output_folder, f"{pipe_number}.xlsx")
#new_file_path = os.path.join("E:\\JIESHOU",f"{pipe_number}.xlsx")
#new_file_path = os.path.join("E:\\JIESHOU",f"{pipe_number}.xlsx")
#new_file_path = os.path.join("C:\\33",f"{pipe_number}.xlsx")
# 设置已存在的 Sheet 名称
existing_sheets = set()
# 创建新的 Excel 工作簿
new_wb = Workbook()
# 删除默认生成的第一个Sheet
default_sheet = new_wb.active
new_wb.remove(default_sheet)
# 遍历与该管线号对应的所有工艺卡编号
for process_card in df_merge.loc[df_merge['管线号'] == pipe_number, '工艺卡编号'].unique():
template_path = os.path.join(template_folder, f"{process_card}.xlsx")
if os.path.exists(template_path):
wb_template = load_workbook(template_path)
sheet_name = process_card
# 确保 Sheet 名称唯一
suffix = 1
while sheet_name in existing_sheets:
sheet_name = f"{process_card}_{suffix}"
suffix += 1
# 获取模版的第一个sheet
template_sheet = wb_template.active
# 创建一个新的工作表
new_sheet = new_wb.create_sheet(title=sheet_name)
# 复制数据
for row in template_sheet.iter_rows(values_only=True):
# new_sheet.append(row) # 将每一行的数据添加到新的工作表中
for cell in row:
new_sheet[cell.coordinate].value = cell.value
if cell.has_style:
new_sheet[cell.coordinate].font = cell.font
new_sheet[cell.coordinate].border = cell.border
new_sheet[cell.coordinate].fill = cell.fill
new_sheet[cell.coordinate].number_format = cell.number_format
new_sheet[cell.coordinate].protection = cell.protection
new_sheet[cell.coordinate].alignment = cell.alignment
# 复制图片
for img in template_sheet._images:
new_sheet.add_image(img)
existing_sheets.add(sheet_name)
else:
print(f"模板文件 {process_card}.xlsx 不存在，请检查路径！")
# 保存新文件
new_wb.save(new_file_path)
print(f"已创建: {new_file_path} 包含模版: {existing_sheets}")
print("所有文件处理完成！")

复制代码

程序报错
D:\PYTHON_NEW\pythonProject\.venv\Scripts\python.exe "D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py"
Traceback (most recent call last):
File "D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py", line 60, in <module>
new_sheet[cell.coordinate].value = cell.value
^^^^^^^^^^
AttributeError: 'NoneType' object has no attribute 'value'

颂风侯 · 发表于 2024-7-26 14:37:45

import pandas as pd
import os
from openpyxl import load_workbook, Workbook
# 假设你的 DataFrame 已经创建为 df_merge
df_merge = pd.read_excel("提取数据2.xlsx")
# 模板文件夹路径
template_folder = "D:/PYTHON_NEW/pythonProject/提取python excel/工艺卡模版"
# 定义输出路径
output_folder = "C:\\集中"
# 确保输出文件夹存在
os.makedirs(output_folder, exist_ok=True)
# 遍历每一行
for index, row in df_merge.iterrows():
pipe_number = row['管线号'] # 假设管线号在 DataFrame 中的列名是 '管线号'
# 创建新的 Excel 文件
new_file_path = os.path.join(output_folder, f"{pipe_number}.xlsx")
#new_file_path = os.path.join("E:\\JIESHOU",f"{pipe_number}.xlsx")
#new_file_path = os.path.join("E:\\JIESHOU",f"{pipe_number}.xlsx")
#new_file_path = os.path.join("C:\\33",f"{pipe_number}.xlsx")
# 设置已存在的 Sheet 名称
existing_sheets = set()
# 创建新的 Excel 工作簿
new_wb = Workbook()
# 删除默认生成的第一个Sheet
default_sheet = new_wb.active
new_wb.remove(default_sheet)
# 遍历与该管线号对应的所有工艺卡编号
for process_card in df_merge.loc[df_merge['管线号'] == pipe_number, '工艺卡编号'].unique():
template_path = os.path.join(template_folder, f"{process_card}.xlsx")
if os.path.exists(template_path):
wb_template = load_workbook(template_path)
sheet_name = process_card
# 确保 Sheet 名称唯一
suffix = 1
while sheet_name in existing_sheets:
sheet_name = f"{process_card}_{suffix}"
suffix += 1
# 获取模版的第一个sheet
template_sheet = wb_template.active
# 创建一个新的工作表
new_sheet = new_wb.create_sheet(title=sheet_name)
# 复制数据
for i, row in enumerate(template_sheet.iter_rows(values_only=False)):
for j, cell in enumerate(row):
new_cell = new_sheet.cell(row=i + 1, column=j + 1, value=cell.value)
if cell.has_style:
new_cell.font = cell.font
new_cell.border = cell.border
new_cell.fill = cell.fill
new_cell.number_format = cell.number_format
new_cell.protection = cell.protection
new_cell.alignment = cell.alignment
# 复制图片
for img in template_sheet._images:
new_sheet.add_image(img)
existing_sheets.add(sheet_name)
else:
print(f"模板文件 {process_card}.xlsx 不存在，请检查路径！")
# 保存新文件
new_wb.save(new_file_path)
print(f"已创建: {new_file_path} 包含模版: {existing_sheets}")
print("所有文件处理完成！")

复制代码

报错如下，
D:\PYTHON_NEW\pythonProject\.venv\Scripts\python.exe "D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py"
Traceback (most recent call last):
  File "D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py", line 61, in <module>
new_cell.font = cell.font
^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\openpyxl\styles\styleable.py", line 27, in __set__
setattr(instance._style, self.key, coll.add(value))
                                    ^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\openpyxl\utils\indexed_list.py", line 48, in add
self.append(value)
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\openpyxl\utils\indexed_list.py", line 43, in append
if value not in self._dict:
   ^^^^^^^^^^^^^^^^^^^^^^^
TypeError: unhashable type: 'StyleProxy'

Process finished with exit code 1

颂风侯 · 发表于 2024-7-26 14:42:30

import pandas as pd
import os
from openpyxl import load_workbook, Workbook
# 假设你的 DataFrame 已经创建为 df_merge
df_merge = pd.read_excel("提取数据2.xlsx")
报错如下
D:\PYTHON_NEW\pythonProject\.venv\Scripts\python.exe "D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py"
D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py:61: DeprecationWarning: Call to deprecated function copy (Use copy(obj) or cell.obj = cell.obj + other).
new_cell.font = cell.font.copy() if cell.font else None
D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py:62: DeprecationWarning: Call to deprecated function copy (Use copy(obj) or cell.obj = cell.obj + other).
new_cell.border = cell.border.copy() if cell.border else None
D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py:63: DeprecationWarning: Call to deprecated function copy (Use copy(obj) or cell.obj = cell.obj + other).
new_cell.fill = cell.fill.copy() if cell.fill else None
D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py:65: DeprecationWarning: Call to deprecated function copy (Use copy(obj) or cell.obj = cell.obj + other).
new_cell.protection = cell.protection.copy() if cell.protection else None
D:\PYTHON_NEW\pythonProject\提取python excel\可用抽出工艺卡片.py:66: DeprecationWarning: Call to deprecated function copy (Use copy(obj) or cell.obj = cell.obj + other).
new_cell.alignment = cell.alignment.copy() if cell.alignment else None
已创建: C:/TRIM-排污-取样器水槽-N1-40-A1TB52-N.xlsx 包含模版: {'HKB12-02', 'HKB12-03'}
已创建: C:/TRIM-排污-取样器水槽-N1-40-A1TB52-N.xlsx 包含模版: {'HKB12-02', 'HKB12-03'}
已创建: C:/TRIM-排污-取样器水槽-N1-40-A1TB52-N.xlsx 包含模版: {'HKB12-02', 'HKB12-03'}
已创建: C:/TRIM-排污-取样器水槽-N1-40-A1TB52-N.xlsx 包含模版: {'HKB12-02', 'HKB12-03'}
已创建: C:/TRIM-排污-取样器水槽-N1-40-A1TB52-N.xlsx 包含模版: {'HKB12-02', 'HKB12-03'}
已创建: C:/TRIM-排污-安全阀及消声器排水-20-A1TB51-N.xlsx 包含模版: {'HKB12-02'}
已创建: C:/TRIM-排污-安全阀及消声器排水-20-A1TB51-N.xlsx 包含模版: {'HKB12-02'}
已创建: C:/TRIM-排污-安全阀及消声器排水-20-A1TB51-N.xlsx 包含模版: {'HKB12-02'}
已创建: C:/TRIM-GG.xlsx 包含模版: {'HKB12-02'}
已创建: C:/TRIM-CC.xlsx 包含模版: {'HKB12-01'}
已创建: C:/TRIM-BB.xlsx 包含模版: {'HKB12-02'}
已创建: C:/TRIM-BB.xlsx 包含模版: {'HKB12-02'}
所有文件处理完成！
Process finished with exit code 0
# 模板文件夹路径
template_folder = "D:/PYTHON_NEW/pythonProject/提取python excel/工艺卡模版"
# 定义输出路径
output_folder = "C:\\集中"
# 确保输出文件夹存在
os.makedirs(output_folder, exist_ok=True)
# 遍历每一行
for index, row in df_merge.iterrows():
pipe_number = row['管线号'] # 假设管线号在 DataFrame 中的列名是 '管线号'
# 创建新的 Excel 文件
new_file_path = os.path.join(output_folder, f"{pipe_number}.xlsx")
#new_file_path = os.path.join("E:\\JIESHOU",f"{pipe_number}.xlsx")
#new_file_path = os.path.join("E:\\JIESHOU",f"{pipe_number}.xlsx")
#new_file_path = os.path.join("C:\\33",f"{pipe_number}.xlsx")
# 设置已存在的 Sheet 名称
existing_sheets = set()
# 创建新的 Excel 工作簿
new_wb = Workbook()
# 删除默认生成的第一个Sheet
default_sheet = new_wb.active
new_wb.remove(default_sheet)
# 遍历与该管线号对应的所有工艺卡编号
for process_card in df_merge.loc[df_merge['管线号'] == pipe_number, '工艺卡编号'].unique():
template_path = os.path.join(template_folder, f"{process_card}.xlsx")
if os.path.exists(template_path):
wb_template = load_workbook(template_path)
sheet_name = process_card
# 确保 Sheet 名称唯一
suffix = 1
while sheet_name in existing_sheets:
sheet_name = f"{process_card}_{suffix}"
suffix += 1
# 获取模版的第一个sheet
template_sheet = wb_template.active
# 创建一个新的工作表
new_sheet = new_wb.create_sheet(title=sheet_name)
# 复制数据
for i, row in enumerate(template_sheet.iter_rows(values_only=False)):
for j, cell in enumerate(row):
new_cell = new_sheet.cell(row=i + 1, column=j + 1, value=cell.value)
if cell.has_style:
new_cell.font = cell.font.copy() if cell.font else None
new_cell.border = cell.border.copy() if cell.border else None
new_cell.fill = cell.fill.copy() if cell.fill else None
new_cell.number_format = cell.number_format
new_cell.protection = cell.protection.copy() if cell.protection else None
new_cell.alignment = cell.alignment.copy() if cell.alignment else None
# 复制图片
for img in template_sheet._images:
new_sheet.add_image(img)
existing_sheets.add(sheet_name)
else:
print(f"模板文件 {process_card}.xlsx 不存在，请检查路径！")
# 保存新文件
new_wb.save(new_file_path)
print(f"已创建: {new_file_path} 包含模版: {existing_sheets}")
print("所有文件处理完成！")

复制代码

能抽出数据，但是图片没抽出来的，单元格格式也不对

颂风侯 · 发表于 2024-7-26 14:45:05

主要是合并，对齐，行高这些都不对
图片没拉过去

颂风侯 · 发表于 2024-7-26 14:49:58

# Copyright (c) 2010-2024 openpyxl
from copy import copy
from warnings import warn
from .numbers import (
BUILTIN_FORMATS,
BUILTIN_FORMATS_MAX_SIZE,
BUILTIN_FORMATS_REVERSE,
)
from .proxy import StyleProxy
from .cell_style import StyleArray
from .named_styles import NamedStyle
from .builtins import styles
class StyleDescriptor(object):
def __init__(self, collection, key):
self.collection = collection
self.key = key
def __set__(self, instance, value):
coll = getattr(instance.parent.parent, self.collection)
if not getattr(instance, "_style"):
instance._style = StyleArray()
setattr(instance._style, self.key, coll.add(value))
def __get__(self, instance, cls):
coll = getattr(instance.parent.parent, self.collection)
if not getattr(instance, "_style"):
instance._style = StyleArray()
idx = getattr(instance._style, self.key)
return StyleProxy(coll[idx])
class NumberFormatDescriptor(object):
key = "numFmtId"
collection = '_number_formats'
def __set__(self, instance, value):
coll = getattr(instance.parent.parent, self.collection)
if value in BUILTIN_FORMATS_REVERSE:
idx = BUILTIN_FORMATS_REVERSE[value]
else:
idx = coll.add(value) + BUILTIN_FORMATS_MAX_SIZE
if not getattr(instance, "_style"):
instance._style = StyleArray()
setattr(instance._style, self.key, idx)
def __get__(self, instance, cls):
if not getattr(instance, "_style"):
instance._style = StyleArray()
idx = getattr(instance._style, self.key)
if idx < BUILTIN_FORMATS_MAX_SIZE:
return BUILTIN_FORMATS.get(idx, "General")
coll = getattr(instance.parent.parent, self.collection)
return coll[idx - BUILTIN_FORMATS_MAX_SIZE]
class NamedStyleDescriptor(object):
key = "xfId"
collection = "_named_styles"
def __set__(self, instance, value):
if not getattr(instance, "_style"):
instance._style = StyleArray()
coll = getattr(instance.parent.parent, self.collection)
if isinstance(value, NamedStyle):
style = value
if style not in coll:
instance.parent.parent.add_named_style(style)
elif value not in coll.names:
if value in styles: # is it builtin?
style = styles[value]
if style not in coll:
instance.parent.parent.add_named_style(style)
else:
raise ValueError("{0} is not a known style".format(value))
else:
style = coll[value]
instance._style = copy(style.as_tuple())
def __get__(self, instance, cls):
if not getattr(instance, "_style"):
instance._style = StyleArray()
idx = getattr(instance._style, self.key)
coll = getattr(instance.parent.parent, self.collection)
return coll.names[idx]
class StyleArrayDescriptor(object):
def __init__(self, key):
self.key = key
def __set__(self, instance, value):
if instance._style is None:
instance._style = StyleArray()
setattr(instance._style, self.key, value)
def __get__(self, instance, cls):
if instance._style is None:
return False
return bool(getattr(instance._style, self.key))
class StyleableObject(object):
"""
Base class for styleble objects implementing proxy and lookup functions
"""
font = StyleDescriptor('_fonts', "fontId")
fill = StyleDescriptor('_fills', "fillId")
border = StyleDescriptor('_borders', "borderId")
number_format = NumberFormatDescriptor()
protection = StyleDescriptor('_protections', "protectionId")
alignment = StyleDescriptor('_alignments', "alignmentId")
style = NamedStyleDescriptor()
quotePrefix = StyleArrayDescriptor('quotePrefix')
pivotButton = StyleArrayDescriptor('pivotButton')
__slots__ = ('parent', '_style')
def __init__(self, sheet, style_array=None):
self.parent = sheet
if style_array is not None:
style_array = StyleArray(style_array)
self._style = style_array
@property
def style_id(self):
if self._style is None:
self._style = StyleArray()
return self.parent.parent._cell_styles.add(self._style)
@property
def has_style(self):
if self._style is None:
return False
return any(self._style)

复制代码

失败了，报错如下
D:\PYTHON_NEW\pythonProject\.venv\Scripts\python.exe "D:\PYTHON_NEW\pythonProject\提取python excel\测试含图片的excel抽取工艺卡.py"
Traceback (most recent call last):
  File "D:\PYTHON_NEW\pythonProject\提取python excel\测试含图片的excel抽取工艺卡.py", line 59, in <module>
new_cell.font = cell.font
^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\openpyxl\styles\styleable.py", line 27, in __set__
setattr(instance._style, self.key, coll.add(value))
                                    ^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\openpyxl\utils\indexed_list.py", line 48, in add
self.append(value)
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\openpyxl\utils\indexed_list.py", line 43, in append
if value not in self._dict:
   ^^^^^^^^^^^^^^^^^^^^^^^
TypeError: unhashable type: 'StyleProxy'

Process finished with exit code 1

颂风侯 · 发表于 2024-7-26 14:52:48

import pandas as pd
import os
from openpyxl import load_workbook, Workbook
# 假设你的 DataFrame 已经创建为 df_merge
df_merge = pd.read_excel("提取数据2.xlsx")
# 模板文件夹路径
template_folder = "D:/PYTHON_NEW/pythonProject/提取python excel/工艺卡模版"
# 定义输出路径
output_folder = "C:\\集中"
# 确保输出文件夹存在
os.makedirs(output_folder, exist_ok=True)
# 遍历每一行
for index, row in df_merge.iterrows():
pipe_number = row['管线号'] # 假设管线号在 DataFrame 中的列名是 '管线号'
# 创建新的 Excel 文件
new_file_path = os.path.join(output_folder, f"{pipe_number}.xlsx")
# 设置已存在的 Sheet 名称
existing_sheets = set()
# 创建新的 Excel 工作簿
new_wb = Workbook()
# 删除默认生成的第一个Sheet
default_sheet = new_wb.active
new_wb.remove(default_sheet)
# 遍历与该管线号对应的所有工艺卡编号
for process_card in df_merge.loc[df_merge == pipe_number, '工艺卡编号'].unique():
template_path = os.path.join(template_folder, f"{process_card}.xlsx")
if os.path.exists(template_path):
wb_template = load_workbook(template_path)
sheet_name = process_card
# 确保 Sheet 名称唯一
suffix = 1
while sheet_name in existing_sheets:
sheet_name = f"{process_card}_{suffix}"
suffix += 1
# 获取模版的第一个sheet
template_sheet = wb_template.active
new_sheet = new_wb.create_sheet(title=sheet_name)
# 复制数据和样式
for i, row in enumerate(template_sheet.iter_rows(values_only=False)):
for j, cell in enumerate(row):
new_cell = new_sheet.cell(row=i + 1, column=j + 1, value=cell.value)
# 复制样式属性
if cell.has_style:
if cell.font is not None:
new_cell.font = cell.font
if cell.border is not None:
new_cell.border = cell.border
if cell.fill is not None:
new_cell.fill = cell.fill
new_cell.number_format = cell.number_format
new_cell.protection = cell.protection
if cell.alignment is not None:
new_cell.alignment = cell.alignment
# 复制行高
for row in template_sheet.iter_rows():
new_sheet.row_dimensions[row[0].row].height = row[0].row_height
# 复制合并单元格
for merged_range in template_sheet.merged_cells.ranges:
new_sheet.merge_cells(str(merged_range))
# 复制图片
for img in template_sheet._images:
new_sheet.add_image(img)
existing_sheets.add(sheet_name)
else:
print(f"模板文件 {process_card}.xlsx 不存在，请检查路径！")
# 保存新文件
new_wb.save(new_file_path)
print(f"已创建: {new_file_path} 包含模版: {existing_sheets}")
print("所有文件处理完成！")

复制代码

还是报错失败的。如下
D:\PYTHON_NEW\pythonProject\.venv\Scripts\python.exe "D:\PYTHON_NEW\pythonProject\提取python excel\测试含图片的excel抽取工艺卡.py"
Traceback (most recent call last):
  File "D:\PYTHON_NEW\pythonProject\提取python excel\测试含图片的excel抽取工艺卡.py", line 33, in <module>
for process_card in df_merge.loc[df_merge == pipe_number, '工艺卡编号'].unique():
                     ~~~~~~~~~~~~^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1184, in __getitem__
return self._getitem_tuple(key)
         ^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1368, in _getitem_tuple
return self._getitem_lowerdim(tup)
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1089, in _getitem_lowerdim
return getattr(section, self.name)[new_key]
         ~~~~~~~~~~~~~~~~~~~~~~~~~~~^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1191, in __getitem__
return self._getitem_axis(maybe_callable, axis=axis)
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1418, in _getitem_axis
raise ValueError("Cannot index with multidimensional key")
ValueError: Cannot index with multidimensional key

Process finished with exit code 1

颂风侯 · 发表于 2024-7-26 15:06:03

import pandas as pd
import os
from openpyxl import load_workbook, Workbook
# 假设你的 DataFrame 已经创建为 df_merge
df_merge = pd.read_excel("提取数据2.xlsx")
# 模板文件夹路径
template_folder = "D:/PYTHON_NEW/pythonProject/提取python excel/工艺卡模版"
# 定义输出路径
output_folder = "C:\\集中"
# 确保输出文件夹存在
os.makedirs(output_folder, exist_ok=True)
# 遍历每一行
for index, row in df_merge.iterrows():
pipe_number = row['管线号'] # 假设管线号在 DataFrame 中的列名是 '管线号'
# 创建新的 Excel 文件
new_file_path = os.path.join(output_folder, f"{pipe_number}.xlsx")
# 设置已存在的 Sheet 名称
existing_sheets = set()
# 创建新的 Excel 工作簿
new_wb = Workbook()
# 删除默认生成的第一个Sheet
default_sheet = new_wb.active
new_wb.remove(default_sheet)
# 遍历与该管线号对应的所有工艺卡编号
for process_card in df_merge.loc[df_merge == pipe_number, '工艺卡编号'].unique():
template_path = os.path.join(template_folder, f"{process_card}.xlsx")
if os.path.exists(template_path):
wb_template = load_workbook(template_path)
sheet_name = process_card
# 确保 Sheet 名称唯一
suffix = 1
while sheet_name in existing_sheets:
sheet_name = f"{process_card}_{suffix}"
suffix += 1
# 获取模版的第一个sheet
template_sheet = wb_template.active
new_sheet = new_wb.create_sheet(title=sheet_name)
# 复制数据和样式
for i, row in enumerate(template_sheet.iter_rows(values_only=False)):
for j, cell in enumerate(row):
new_cell = new_sheet.cell(row=i + 1, column=j + 1, value=cell.value)
# 复制样式属性
if cell.has_style:
if cell.font is not None:
new_cell.font = cell.font
if cell.border is not None:
new_cell.border = cell.border
if cell.fill is not None:
new_cell.fill = cell.fill
new_cell.number_format = cell.number_format
new_cell.protection = cell.protection
if cell.alignment is not None:
new_cell.alignment = cell.alignment
# 复制行高
for row in template_sheet.iter_rows():
new_sheet.row_dimensions[row[0].row].height = row[0].row_height
# 复制合并单元格
for merged_range in template_sheet.merged_cells.ranges:
new_sheet.merge_cells(str(merged_range))
# 复制图片
for img in template_sheet._images:
new_sheet.add_image(img)
existing_sheets.add(sheet_name)
else:
print(f"模板文件 {process_card}.xlsx 不存在，请检查路径！")
# 保存新文件
new_wb.save(new_file_path)
print(f"已创建: {new_file_path} 包含模版: {existing_sheets}")
print("所有文件处理完成！")

复制代码

AI老师能不能发的代码可以直接复制不用调缩进的。。。
失败如下
D:\PYTHON_NEW\pythonProject\.venv\Scripts\python.exe "D:\PYTHON_NEW\pythonProject\提取python excel\测试含图片的excel抽取工艺卡.py"
Traceback (most recent call last):
  File "D:\PYTHON_NEW\pythonProject\提取python excel\测试含图片的excel抽取工艺卡.py", line 33, in <module>
for process_card in df_merge.loc[df_merge == pipe_number, '工艺卡编号'].unique():
                     ~~~~~~~~~~~~^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1184, in __getitem__
return self._getitem_tuple(key)
         ^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1368, in _getitem_tuple
return self._getitem_lowerdim(tup)
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1089, in _getitem_lowerdim
return getattr(section, self.name)[new_key]
         ~~~~~~~~~~~~~~~~~~~~~~~~~~~^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1191, in __getitem__
return self._getitem_axis(maybe_callable, axis=axis)
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1418, in _getitem_axis
raise ValueError("Cannot index with multidimensional key")
ValueError: Cannot index with multidimensional key

Process finished with exit code 1

颂风侯 · 发表于 2024-7-26 15:07:49

import pandas as pd
import os
from openpyxl import load_workbook, Workbook
# 假设你的 DataFrame 已经创建为 df_merge
df_merge = pd.read_excel("提取数据2.xlsx")
# 模板文件夹路径
template_folder = "D:/PYTHON_NEW/pythonProject/提取python excel/工艺卡模版"
# 定义输出路径
output_folder = "C:\\集中"
# 确保输出文件夹存在
os.makedirs(output_folder, exist_ok=True)
# 遍历每一行
for index, row in df_merge.iterrows():
pipe_number = row['管线号'] # 假设管线号在 DataFrame 中的列名是 '管线号'
# 创建新的 Excel 文件
new_file_path = os.path.join(output_folder, f"{pipe_number}.xlsx")
# 设置已存在的 Sheet 名称
existing_sheets = set()
# 创建新的 Excel 工作簿
new_wb = Workbook()
# 删除默认生成的第一个Sheet
default_sheet = new_wb.active
new_wb.remove(default_sheet)
# 遍历与该管线号对应的所有工艺卡编号
for process_card in df_merge.loc[df_merge == pipe_number, '工艺卡编号'].unique():
template_path = os.path.join(template_folder, f"{process_card}.xlsx")
if os.path.exists(template_path):
wb_template = load_workbook(template_path)
sheet_name = process_card
# 确保 Sheet 名称唯一
suffix = 1
while sheet_name in existing_sheets:
sheet_name = f"{process_card}_{suffix}"
suffix += 1
# 获取模版的第一个sheet
template_sheet = wb_template.active
new_sheet = new_wb.create_sheet(title=sheet_name)
# 复制数据和样式
for i, row in enumerate(template_sheet.iter_rows(values_only=False)):
for j, cell in enumerate(row):
new_cell = new_sheet.cell(row=i + 1, column=j + 1, value=cell.value)
# 复制样式属性
if cell.has_style:
if cell.font is not None:
new_cell.font = cell.font
if cell.border is not None:
new_cell.border = cell.border
if cell.fill is not None:
new_cell.fill = cell.fill
new_cell.number_format = cell.number_format
new_cell.protection = cell.protection
if cell.alignment is not None:
new_cell.alignment = cell.alignment
# 复制行高
for row in template_sheet.iter_rows():
new_sheet.row_dimensions[row[0].row].height = row[0].row_height
# 复制合并单元格
for merged_range in template_sheet.merged_cells.ranges:
new_sheet.merge_cells(str(merged_range))
# 复制图片
for img in template_sheet._images:
new_sheet.add_image(img)
existing_sheets.add(sheet_name)
else:
print(f"模板文件 {process_card}.xlsx 不存在，请检查路径！")
# 保存新文件
new_wb.save(new_file_path)
print(f"已创建: {new_file_path} 包含模版: {existing_sheets}")
print("所有文件处理完成！")

复制代码

报错如下
D:\PYTHON_NEW\pythonProject\.venv\Scripts\python.exe "D:\PYTHON_NEW\pythonProject\提取python excel\测试含图片的excel抽取工艺卡.py"
Traceback (most recent call last):
  File "D:\PYTHON_NEW\pythonProject\提取python excel\测试含图片的excel抽取工艺卡.py", line 33, in <module>
for process_card in df_merge.loc[df_merge == pipe_number, '工艺卡编号'].unique():
                     ~~~~~~~~~~~~^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1184, in __getitem__
return self._getitem_tuple(key)
         ^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1368, in _getitem_tuple
return self._getitem_lowerdim(tup)
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1089, in _getitem_lowerdim
return getattr(section, self.name)[new_key]
         ~~~~~~~~~~~~~~~~~~~~~~~~~~~^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1191, in __getitem__
return self._getitem_axis(maybe_callable, axis=axis)
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "D:\PYTHON_NEW\pythonProject\.venv\Lib\site-packages\pandas\core\indexing.py", line 1418, in _getitem_axis
raise ValueError("Cannot index with multidimensional key")
ValueError: Cannot index with multidimensional key

Process finished with exit code 1

账号		自动登录	找回密码
密码			立即注册

根据excel列数据提取模版，生成新的excel，有图片和格式的

马上注册，结交更多好友，享用更多功能^_^

浏览过的版块