首先貼出四種方法的適用範圍比較:
注釋:Excel 2003(即 XLS 文件)有大小限制,最多 65536 行、256 列,所以不支持大文件;而 Excel 2007 及以上(即 XLSX 文件)的限制則為 1048576 行、16384 列。
下面着重介紹如何使用 openpyxl 操作 Excel:
#!/usr/bin/env python
# -*- coding: utf-8 -*-
import os

import openpyxl


class Excel_Operate():
    """Helpers for creating, appending to and reading .xlsx workbooks.

    openpyxl only supports the xlsx format; its advantage is that it can
    read and write large files.
    """

    # Kept only for backward compatibility with code that may read
    # ``Excel_Operate.wb``. ``create`` builds a fresh workbook on every
    # call, so sheets from one call never leak into the next file.
    wb = openpyxl.Workbook()

    @classmethod
    def create(cls, ex_path, name, sheet_name=None, sheet_names=None):
        """Create a new workbook file unless it already exists.

        :param ex_path: directory to save into (created when missing)
        :param name: file name of the workbook
        :param sheet_name: title for the default sheet; the default
            title is kept when this is falsy
        :param sheet_names: titles of additional sheets; each one is
            passed through ``str()``
        :return: True when the file already exists (it is left
            untouched), otherwise None after the workbook is saved
        """
        if not os.path.exists(ex_path):
            os.makedirs(ex_path)
        ex_path_name = os.path.join(ex_path, name)
        if os.path.exists(ex_path_name):
            return True

        # A new workbook per call: reusing one shared workbook would
        # carry the sheets of earlier calls into every later file.
        workbook = openpyxl.Workbook()
        default_sheet = workbook.active
        if sheet_name:
            default_sheet.title = sheet_name
        for extra_title in sheet_names or ():
            workbook.create_sheet(str(extra_title))
        workbook.save(ex_path_name)

    @classmethod
    def add_to_data(cls, ex_path_name, data, sheetname):
        """Append rows to one sheet of an existing workbook and save it.

        :param ex_path_name: full path of the workbook file
        :param data: iterable of rows, e.g. [[1, 2, 3], [4, 5, 6]]
        :param sheetname: title of the sheet to append to
        :return: a ``{"status": False, "message": ...}`` dict when the
            file does not exist, otherwise None
        """
        if not os.path.exists(ex_path_name):
            return {"status": False, "message": "文件不存在"}
        workbook = openpyxl.load_workbook(ex_path_name)
        sheet = workbook[sheetname]  # look the sheet up by its title
        for row in data:
            sheet.append(row)
        workbook.save(ex_path_name)

    @classmethod
    def read_data(cls, ex_path_name, is_col, is_row=True):
        """Read every cell value from the first sheet of a workbook.

        :param ex_path_name: full path of the workbook file
        :param is_col: return the data as a list of columns
        :param is_row: return the data as a list of rows; this flag is
            checked first, so it wins when both flags are truthy
        :return: list of lists of cell values, or [] when both flags
            are falsy
        """
        workbook = openpyxl.load_workbook(ex_path_name)
        sheet = workbook[workbook.sheetnames[0]]
        # Explicit bounds cover rows 1..max_row and columns
        # 1..max_column, the same grid the index-based loops walked.
        bounds = dict(
            min_row=1,
            max_row=sheet.max_row,
            min_col=1,
            max_col=sheet.max_column,
        )
        if is_row:
            return [
                list(values)
                for values in sheet.iter_rows(values_only=True, **bounds)
            ]
        if is_col:
            return [
                list(values)
                for values in sheet.iter_cols(values_only=True, **bounds)
            ]
        return []


if __name__ == "__main__":
    Excel_Operate.create(
        "/tmp/abcd/202108",
        "數據導出.xlsx",
        sheet_name=u"物流數據",
        sheet_names=[1, 2, 3],
    )
    Excel_Operate.add_to_data(
        "/tmp/abcd/202108/數據導出.xlsx",
        data=[[1, 2, 3], [4, 5, 6]],
        sheetname=u"物流數據",
    )
    # Example (disabled): diff the first column of two workbooks.
    # new_data = Excel_Operate.read_data("/tmp/excel/6_new.xlsx", is_col=True, is_row=False)
    #
    # old_data = Excel_Operate.read_data("/tmp/excel/6_old.xlsx", is_col=True, is_row=False)
    # print(len(new_data[0]), len(old_data[0]))
    #
    # new_cha_data = set(new_data[0]) - set(old_data[0])
    # print(new_cha_data)
    #
    # old_cha_data = set(old_data[0]) - set(new_data[0])
    # print(old_cha_data)