zoukankan      html  css  js  c++  java
  • python实现Excel删除特定行、拷贝指定行操作

    工作中遇到的,本来用VBA写的,操作很慢,尝试用Python实现,

    任务需求:

    从原始的两张表中拷贝行到五张表中,如下表所示:

    source1和source2是一样的格式:

            one two three four five
    1 2 3   11 11 22 22 33 33 44 44 55 55

    目标表格有one,two,three,four,five。

    将前三列和对应表的两列拷贝到目标表格中,目标表格中原始也需要删除有关键字的行(注释代码中实现了,但是有8000多行,删除很耗时,改为了手动删除),然后把source1和source2含有同样关键字的行拷贝过来,拷贝的列索引是固定的

    实现:

    采用xlrd读Excel,xlutils写Excel,注释中用win32com删除行(需要安装模块pip install pywin32)

    #! /usr/bin/env python
    # encoding:utf-8
    import os
    import xlrd
    from xlutils.copy import copy
    import win32com.client as win32
    '''
    文件名、修改的表名、查找的字符串固定,如有变化,则相应修改
    '''
    regstr = ['str1', 'str2']
    tarExcels = ['one.xls','two.xls','three.xls','four.xls','five.xls']
    tarSheet = 'targetSheet'
    sourceExcels =['source1.xlsm','source2.xlsm']
    
    def copyFeatrue(sourcefiles,targetfiles):
        for item in sourcefiles:
            workbook = xlrd.open_workbook(item)
            shEng = workbook.sheet_by_index(0)
            rowNum = shEng.nrows
            '''从原始中英文表中提取出要放入五张表的内容'''
            ListMacro =[]
            ListMICRO =[]
            ListATOM =[]
            List3205E =[]
            List3911E =[]
            startRowIdx = 0
            for row in range(rowNum):
                if shEng.cell(row,4).value in regstr:
                    break
                startRowIdx += 1
            for rowIdx in range(startRowIdx,rowNum):
                commstr =[]
                tempMacro = []
                tempMICRO = []
                tempATOM = []
                temp3205E = []
                temp3911E = []
                '''前三列公共,后面五张表各自取不同的列'''
                commstr.append(shEng.cell(rowIdx,0).value)
                commstr.append(shEng.cell(rowIdx,1).value)
                commstr.append(shEng.cell(rowIdx,2).value)
    
                if shEng.cell(rowIdx,4).value:
                    tempMacro.extend(commstr)
                    tempMacro.append(shEng.cell(rowIdx,4).value)
                    tempMacro.append(shEng.cell(rowIdx, 5).value)
    
                if shEng.cell(rowIdx, 8).value:
                    tempMICRO.extend(commstr)
                    tempMICRO.append(shEng.cell(rowIdx, 8).value)
                    tempMICRO.append(shEng.cell(rowIdx, 9).value)
    
                if shEng.cell(rowIdx, 10).value:
                    tempATOM.extend(commstr)
                    tempATOM.append(shEng.cell(rowIdx, 10).value)
                    tempATOM.append(shEng.cell(rowIdx, 11).value)
    
                if shEng.cell(rowIdx, 12).value:
                    temp3205E.extend(commstr)
                    temp3205E.append(shEng.cell(rowIdx, 12).value)
                    temp3205E.append(shEng.cell(rowIdx, 13).value)
    
                if shEng.cell(rowIdx, 14).value:
                    temp3911E.extend(commstr)
                    temp3911E.append(shEng.cell(rowIdx, 14).value)
                    temp3911E.append(shEng.cell(rowIdx, 15).value)
                if tempMacro:
                    ListMacro.append(tempMacro)
                if tempMICRO:
                    ListMICRO.append(tempMICRO)
                if tempATOM:
                    ListATOM.append(tempATOM)
                if temp3205E:
                    List3205E.append(temp3205E)
                if temp3911E:
                    List3911E.append(temp3911E)
    
            '''表名和抽取出的内容一一对应'''
            dic ={}
            dic[tarExcels[0]] = List3911E
            dic[tarExcels[1]] = List3205E
            dic[tarExcels[2]] = ListATOM
            dic[tarExcels[3]] = ListMICRO
            dic[tarExcels[4]] = ListMacro
            realfile =''
    
            '''通过表名查找到对应的表的绝对路径,以便读取'''
            for j in range(5):
                for fileidx in range(len(targetfiles)):
                    if tarExcels[j] in targetfiles[fileidx]:
                        realfile = targetfiles[fileidx]
                        break
                workdest1 = xlrd.open_workbook(realfile)
                shdest1 = workdest1.sheet_by_name(tarSheet)
                rows = shdest1.nrows
                targetlist = dic[tarExcels[j]]
                '''创建新表,将对应内容写入对应表中'''
                newbook = copy(workdest1)
                newsheet = newbook.get_sheet(tarSheet)
                listidx = 0
                '''写入表的位置固定,根据列索引写入'''
                for r in range(rows,rows+len(targetlist)):
                    newsheet.write(r,0,targetlist[listidx][0])
                    newsheet.write(r, 1, targetlist[listidx][1])
                    newsheet.write(r, 2, targetlist[listidx][2])
                    newsheet.write(r, 4, targetlist[listidx][3])
                    newsheet.write(r, 5, targetlist[listidx][4])
                    listidx += 1
                newbook.save(realfile)
    
    if __name__ == '__main__':
        print('Running! Please Wait!
    ')
        targetfiles =[]
        sourcefiles =[]
        '''遍历脚本所在目录下所有文件,并且找出与目标文件一致的文件的绝对路径'''
        for root,dirs,files in os.walk(os.getcwd()):
            for name in files:
                if name in tarExcels:
                    targetfiles.append(os.path.join(root, name))
                if name in sourceExcels:
                    sourcefiles.append(os.path.join(root, name))
        copyFeatrue(sourcefiles,targetfiles)
        print('^_^Success!^_^')
        input('input any key to continue!
    ')
    
    '''
    class copyExcel:
        def __init__(self,filename = None):
            self.workApp = win32.Dispatch('Excel.Application')
            if filename:
                self.filename = filename
                self.workbook = self.workApp.Workbooks.Open(filename)
            else:
                self.workbook = self.workApp.Workbooks.Add()
                self.filename = ''
    
        def deleteRow(self,sheet,row):
            sht = self.workbook.Worksheets(sheet)
            sht.Rows(row).Delete()
    
        def save(self, newfile=None):
            if newfile:
                self.filename = newfile
                self.workbook.SaveAs(newfile)
            else:
                self.workbook.Save()
    
        def close(self):
            self.workbook.Close(SaveChanges = 0)
            del self.workApp
    
        def getCell(self,sheet,row,col):
            sht = self.workbook.Worksheets(sheet)
            return sht.Cells(row,col).Value
    
        def setCell(self,sheet,row,col,value):
            sht = self.xlBook.Worksheets(sheet)
            sht.Cells(row, col).Value = value
        def getRowNum(self,sheet):
            sht = self.workbook.Worksheets(sheet)
            return sht.usedrange.rows.count
    
    ##删除目标字符串对应的行
    def delFeature(destdir):
        for i in range(len(tarExcels)):
            sourfile = destdir + '\' + tarExcels[i]
            temp = copyExcel(sourfile)
            #workbook = win32.Dispatch('Excel.Application').Workbooks.Open('D:pychenliu.xlsx')
            rowNum = temp.getRowNum(tarSheet)
            print(rowNum)
            row = 1
            while row <= rowNum:
                #print(row)
                if temp.getCell(tarSheet,row,5) == 'str1' or temp.getCell(tarSheet,row,5) == 'str2':
                    temp.deleteRow(tarSheet,row)
                    row -= 1
                    rowNum -=1
                row += 1
            temp.save()
            temp.close()
    
    '''
    

      

  • 相关阅读:
    MySQL select语句中where条件的提取过程
    MySQL特性:ICP,Index Condition Pushdown
    MySQL特性:BKA,Batched Key Access,批量索引访问
    MySQL特性:MRR,Multi-Range Read,多范围读
    show engine innodb status 输出结果解读
    IPv6的一点使用小计
    MySQL 通过ibd恢复数据
    explain 小结
    clickhouse的多路径存储策略
    cenos6.5升级glibc2.18
  • 原文地址:https://www.cnblogs.com/xqn2017/p/8387515.html
Copyright © 2011-2022 走看看