python遍历文件夹下的csv文件,读取文件内容存到数据库

寻找有志同道合的小伙伴,互帮互助,群里还有不错的视频学习教程和PDF电子书!

‘’’

def analysisWorkflowCsv(file):
    """Import the workflow rows of one CSV file into the database.

    The first CSV row is treated as the header: it is printed and not
    inserted. Every following row is mapped by position onto the workflow
    fields and handed to ``insertWorkflows``. The connection is committed
    after every 1000 successful inserts and once more after the last row,
    and it is closed even when processing a row raises.

    Args:
        file: Iterable of CSV text lines, such as an open text-mode file.
    """
    # Column order of the CSV file; the names are the keys insertWorkflows
    # reads from the record.
    columns = (
        'UUID', 'subject', 'signdate', 'U_UnitName', 'U_UnitUser',
        'U_UnitUserTitle', 'U_UnitEndTime', 'U_UnitAction', 'U_UnitToTitle',
    )
    batch_size = 1000

    reader = csv.reader(file)
    # Consume the header so the loop below only sees data rows. An empty
    # file has no header, so return before a connection is opened.
    head_row = next(reader, None)
    if head_row is None:
        return
    print(head_row)

    conn = getConnect_old()
    counter = 0
    try:
        for row in reader:
            if len(row) < len(columns):
                # csv.reader yields [] for blank lines; a row with too few
                # columns cannot be mapped onto the workflow fields.
                if row:
                    print("skipping malformed row at line %d: %r"
                          % (reader.line_num, row))
                continue
            workflow = dict(zip(columns, row))
            # Only rows that insertWorkflows reports as inserted are counted.
            if insertWorkflows(conn, workflow):
                counter += 1
                if counter % batch_size == 0:
                    conn.commitData()
                    print("已经插入工作流数据: %d 条。" % counter)
        # Commit whatever is left of the last, partially filled batch.
        conn.commitData()
    finally:
        conn.closeConn()

2、解析文件内容,首行为标题栏,需要跳过。入库时每满1000条commit一次,主要是因为Python频繁提交、执行次数达到1000次以上时会报错;每1000条commit一次既可以避免该错误,也能缓解内存压力。

def analysisWorkflowCsv(file):
    """Parse one workflow CSV file and import its rows into the database.

    The first CSV row is treated as the header: it is printed and not
    inserted. Every following row is mapped by position onto the workflow
    fields and handed to ``insertWorkflows``. The connection is committed
    after every 1000 successful inserts and once more after the last row,
    and it is closed even when processing a row raises.

    Args:
        file: Iterable of CSV text lines, such as an open text-mode file.
    """
    # Column order of the CSV file; the names are the keys insertWorkflows
    # reads from the record.
    columns = (
        'UUID', 'subject', 'signdate', 'U_UnitName', 'U_UnitUser',
        'U_UnitUserTitle', 'U_UnitEndTime', 'U_UnitAction', 'U_UnitToTitle',
    )
    batch_size = 1000

    reader = csv.reader(file)
    # Consume the header so the loop below only sees data rows. An empty
    # file has no header, so return before a connection is opened.
    head_row = next(reader, None)
    if head_row is None:
        return
    print(head_row)

    conn = getConnect_old()
    counter = 0
    try:
        for row in reader:
            if len(row) < len(columns):
                # csv.reader yields [] for blank lines; a row with too few
                # columns cannot be mapped onto the workflow fields.
                if row:
                    print("skipping malformed row at line %d: %r"
                          % (reader.line_num, row))
                continue
            workflow = dict(zip(columns, row))
            # Only rows that insertWorkflows reports as inserted are counted.
            if insertWorkflows(conn, workflow):
                counter += 1
                if counter % batch_size == 0:
                    conn.commitData()
                    print("已经插入工作流数据: %d 条。" % counter)
        # Commit whatever is left of the last, partially filled batch.
        conn.commitData()
    finally:
        conn.closeConn()

3、数据入库

def insertWorkflows(__conn, workflow):
    """Insert one workflow record into the ``workflows`` table.

    Args:
        __conn: Connection wrapper exposing ``mssql_exe_sql(sql, params)``.
        workflow: Mapping that provides the keys ``UUID``, ``U_UnitName``,
            ``U_UnitUser``, ``U_UnitUserTitle``, ``U_UnitEndTime``,
            ``U_UnitAction``, ``U_UnitToTitle``, ``subject`` and
            ``signdate``.

    Returns:
        Whatever ``__conn.mssql_exe_sql`` returns for the statement.
    """
    sql = '''
        INSERT INTO workflows (
            UUID, U_UnitName, U_UnitUser, U_UnitUserTitle, U_UnitEndTime,
            U_UnitAction, U_UnitToTitle, subject, signdate
        ) VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s)
    '''
    # Same order as the column list in the statement above.
    keys = (
        'UUID', 'U_UnitName', 'U_UnitUser', 'U_UnitUserTitle',
        'U_UnitEndTime', 'U_UnitAction', 'U_UnitToTitle', 'subject',
        'signdate',
    )
    params = tuple(workflow[key] for key in keys)
    # Trace output only: the values are substituted here for display, while
    # the connection wrapper receives the statement and parameters separately.
    print(sql % params)
    return __conn.mssql_exe_sql(sql, params)

4、python操作sqlserver代码

‘’’

遇到问题没人解答?小编创建了一个Python学习交流QQ群:778463939

寻找有志同道合的小伙伴,互帮互助,群里还有不错的视频学习教程和PDF电子书!

‘’’

import csv
import os

import pymssql

# Set the NLS_LANG environment variable for this process.
os.environ['NLS_LANG'] = 'SIMPLIFIED CHINESE_CHINA.UTF8'

class ConnectionDatabase(object):
    """Database connection wrapper around a single pymssql connection.

    The connection is opened in the constructor and stays open until
    ``closeConn`` is called. The query helpers only open and close their own
    cursor, so one instance can run many statements before committing.
    """

    def __init__(self, ip, user_name, passwd, db, char='utf8', port=None):
        """Open the SQL Server connection.

        Args:
            ip: Server host name or address.
            user_name: Login name.
            passwd: Login password.
            db: Name of the database to use.
            char: Character set passed to the driver.
            port: Optional server port. It is forwarded to
                ``pymssql.connect`` only when given, so the driver default
                applies otherwise.
        """
        self.ip = ip
        self.port = port
        self.username = user_name
        self.passwd = passwd
        # Attribute name kept for compatibility; it holds the database name.
        self.mysqldb = db
        self.char = char
        connect_args = dict(
            host=self.ip,
            user=self.username,
            password=self.passwd,
            database=self.mysqldb,
            charset=self.char,
        )
        if port is not None:
            connect_args['port'] = port
        self.MsSQL_db = pymssql.connect(**connect_args)

    def mssql_findList(self, sql):
        """Run a query and return all of its rows.

        Args:
            sql: The SQL text to execute.

        Returns:
            The rows from ``cursor.fetchall()``, or ``None`` when the query
            produced no rows or failed. A failure is printed, not raised.

        Raises:
            NameError: If the connection does not provide a cursor.
        """
        cursor = self.MsSQL_db.cursor()
        if not cursor:
            raise NameError("数据库连接失败")
        results = None
        try:
            cursor.execute(sql)
            results = cursor.fetchall()
        except Exception as e:
            print(e)
        finally:
            # Release only the cursor; the connection stays usable for later
            # calls and is closed by closeConn().
            cursor.close()
        return results or None

    def mssql_exe_sql(self, sql, params):
        """Execute a data-modifying statement with bound parameters.

        Nothing is committed here; call ``commitData`` to persist the change.
        When the statement fails, the error is printed and the connection is
        rolled back, which also discards earlier statements on this
        connection that have not been committed yet.

        Args:
            sql: The SQL text with parameter placeholders.
            params: The values bound to the placeholders.

        Returns:
            ``True`` when the cursor reports at least one affected row,
            otherwise ``False``.

        Raises:
            NameError: If the connection does not provide a cursor.
        """
        cursor = self.MsSQL_db.cursor()
        if not cursor:
            raise NameError("数据库连接失败")
        result = 0
        try:
            cursor.execute(sql, params)
            result = cursor.rowcount
        except Exception as e:
            print(e)
            self.MsSQL_db.rollback()
        finally:
            # Release only the cursor; closing the connection here would
            # break every following statement and the final commit.
            cursor.close()
        return result > 0

    def commitData(self):
        """Commit the pending transaction; a failure is printed, not raised."""
        try:
            self.MsSQL_db.commit()
        except Exception as e:
            print(e)

    def closeConn(self):
        """Close the database connection if there is one."""
        if self.MsSQL_db:
            self.MsSQL_db.close()

5、执行代码

if __name__ == "__main__":
    # Parent folder that contains the CSV files to import. Raw strings keep
    # the Windows backslashes from being read as escape sequences.
    # Alternative input folder:
    # testFilePath = r"G:\数据解析\csv\workflowcsv"
    testFilePath = r"G:\数据解析\csv\wd25csv"

    readAllFiles(testFilePath)

遇到的问题及解决方式:

(1)以上代码执行时,如果有时间类型的字段,需要先对字符串进行转换:

re.sub(r'[^0-9 :-]', '', timestr)

利用正则表达式去掉时间字符串中除数字、空格、冒号和连字符以外的特殊字符,再作为时间字符串入库,避免代码执行时出现类型转换错误。注意:在字符类中“-”要放在末尾才表示连字符本身,“|”也不表示“或”;原写法 [^0-9 | - | : ] 会把“-”一并删掉,却保留“|”。

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值