使用Python语言读写Excel数据demo

本文介绍了一种使用Python openpyxl库从大型Excel文件中筛选并分割数据的方法。通过读取一个包含特定ID的文本文件,该脚本能够从一个包含13665条记录的Excel文件中筛选出符合ID条件的数据,并将其保存到两个新的Excel文件中:一个包含匹配ID的数据,另一个包含未匹配ID的数据。此过程涉及读取源Excel文件的多个列,将数据与文本文件中的ID进行比较,然后将结果写入新文件。

摘要生成于 C知道 ,由 DeepSeek-R1 满血版支持, 前往体验 >

import openpyxl
from openpyxl import load_workbook
                                                                                   
f = open(file='data/10886数据集/最原始数据/电子病历对应病历号from10886.txt', encoding='utf-8')   
list_f = f.readlines()                                                                                 
ll = []                                                                                                
for item in list_f:                                                                                    
    item = item.replace('\n', '')                                                                      
    ll.append(item)                                                                                    
                                                                                                       
wb = load_workbook("data/10886数据集/最原始数据/首次病程记录_抽取_原始数据_13665.xlsx")          
sheet1 = wb.get_sheet_by_name("Sheet1")                                                                

# 读excel                                                                                                   
column_A = sheet1["A"]                                                                                 
column_B = sheet1["B"]                                                                                 
column_C = sheet1["C"]                                                                                 
column_D = sheet1["D"]                                                                                 
column_E = sheet1["E"]                                                                                 
column_F = sheet1["F"]                                                                                 
column_G = sheet1["G"]                                                                                 
column_H = sheet1["H"]                                                                                 
                                                                                                       
filepath1 = 'data/10886数据集/最原始数据/从13665中抽取出的10886条数据.xlsx'                            
filepath2 = 'data/10886数据集/最原始数据/从13665中抽取出的除10886条数据以外的数据.xlsx'                
                                                                                                       
wb1 = openpyxl.Workbook()                                                                              
ws1 = wb1.create_sheet('Sheet1')                                                                       
                                                                                                       
wb2 = openpyxl.Workbook()                                                                              
ws2 = wb2.create_sheet('Sheet1')                                                                       
                                                                                                       
index_ws1 = 1                                                                                          
index_ws2 = 1
# 写excel                                                                                          
for i in range(0, 13666):                                                                              
    print("i :" + str(i) + "...")                                                                      
    if i == 0:                                                                                         
        ws1.cell(row=index_ws1, column=1, value=sheet1["A"][i].value).value                            
        ws1.cell(row=index_ws1, column=2, value=sheet1["B"][i].value).value                            
        ws1.cell(row=index_ws1, column=3, value=sheet1["C"][i].value).value                            
        ws1.cell(row=index_ws1, column=4, value=sheet1["D"][i].value).value                            
        ws1.cell(row=index_ws1, column=5, value=sheet1["E"][i].value).value                            
        ws1.cell(row=index_ws1, column=6, value=sheet1["F"][i].value).value                            
        ws1.cell(row=index_ws1, column=7, value=sheet1["G"][i].value).value                            
        ws1.cell(row=index_ws1, column=8, value=sheet1["H"][i].value).value                            
                                                                                                       
        ws2.cell(row=index_ws2, column=1, value=sheet1["A"][i].value).value                            
        ws2.cell(row=index_ws2, column=2, value=sheet1["B"][i].value).value                            
        ws2.cell(row=index_ws2, column=3, value=sheet1["C"][i].value).value                            
        ws2.cell(row=index_ws2, column=4, value=sheet1["D"][i].value).value                            
        ws2.cell(row=index_ws2, column=5, value=sheet1["E"][i].value).value                            
        ws2.cell(row=index_ws2, column=6, value=sheet1["F"][i].value).value                            
        ws2.cell(row=index_ws2, column=7, value=sheet1["G"][i].value).value                            
        ws2.cell(row=index_ws2, column=8, value=sheet1["H"][i].value).value                            
                                                                                                       
        index_ws1 += 1                                                                                 
        index_ws2 += 1                                                                                 
    else:                                                                                              
        if str(sheet1["A"][i].value) in ll:                                                            
            ws1.cell(row=index_ws1, column=1, value=sheet1["A"][i].value).value                        
            ws1.cell(row=index_ws1, column=2, value=sheet1["B"][i].value).value                        
            ws1.cell(row=index_ws1, column=3, value=sheet1["C"][i].value).value                        
            ws1.cell(row=index_ws1, column=4, value=sheet1["D"][i].value).value                        
            ws1.cell(row=index_ws1, column=5, value=sheet1["E"][i].value).value                        
            ws1.cell(row=index_ws1, column=6, value=sheet1["F"][i].value).value                        
            ws1.cell(row=index_ws1, column=7, value=sheet1["G"][i].value).value                        
            ws1.cell(row=index_ws1, column=8, value=sheet1["H"][i].value).value                        
                                                                                                       
            index_ws1 += 1                                                                             
        elif str(sheet1["A"][i].value) not in ll:                                                      
            ws2.cell(row=index_ws2, column=1, value=sheet1["A"][i].value).value                        
            ws2.cell(row=index_ws2, column=2, value=sheet1["B"][i].value).value                        
            ws2.cell(row=index_ws2, column=3, value=sheet1["C"][i].value).value                        
            ws2.cell(row=index_ws2, column=4, value=sheet1["D"][i].value).value                        
            ws2.cell(row=index_ws2, column=5, value=sheet1["E"][i].value).value                        
            ws2.cell(row=index_ws2, column=6, value=sheet1["F"][i].value).value                        
            ws2.cell(row=index_ws2, column=7, value=sheet1["G"][i].value).value                        
            ws2.cell(row=index_ws2, column=8, value=sheet1["H"][i].value).value                        
                                                                                                       
            index_ws2 += 1                                                                             
                                                                                                       
wb1.save(filepath1)                                                                                    
wb2.save(filepath2)                                                                                    

 

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值