# -*- coding: utf-8 -*-
# Converts a CTRL_A/CTRL_B delimited speech log into a flat CTRL_A delimited
# file with the columns: date, time, id, asr, intent, domain.
import sys
import time

CTRL_A = '\x01'  # separates the fields of one record
CTRL_B = '\x02'  # separates the key from the value inside one field

# Module-level names kept so that anything importing them keeps working.
# speechHandle() builds fresh per-record values and does not touch these.
thedate = ''
thetime = ''
sn = ''
asr = ''
intent = ''
nlp = ''
domain = ''

# A record is only converted when it has exactly this many CTRL_A fields.
_EXPECTED_FIELDS = 6


def _formatRecord(line):
    """Turn one raw input line into an output line.

    Args:
        line: One line of the input file, with or without its line ending.

    Returns:
        The CTRL_A joined output line (terminated by a newline), or None when
        the line does not contain exactly six CTRL_A separated fields.

    Raises:
        ValueError: If the value of the ``time`` key is not an integer.
    """
    # Drop the line terminator first; otherwise the value of the last field
    # would carry it into the output and produce blank lines.
    fields = line.rstrip('\r\n').split(CTRL_A)
    if len(fields) != _EXPECTED_FIELDS:
        return None

    # Start every record from empty values so that a missing key yields an
    # empty column instead of the previous record's value.
    values = {'date': '', 'time': '', 'id': '', 'asr': '',
              'intent': '', 'domain': ''}

    for field in fields:
        pair = field.split(CTRL_B)
        if len(pair) != 2:
            # Not a key/value field; ignored.
            continue
        key = pair[0].strip()
        value = pair[1]
        if key == 'time':
            # The value is divided by 1000 before time.localtime(), i.e. it is
            # treated as milliseconds since the epoch; rendered in local time.
            moment = time.localtime(int(value) // 1000)
            values['date'] = time.strftime("%Y-%m-%d", moment)
            values['time'] = time.strftime("%H:%M:%S", moment)
        elif key == 'intent':
            values['intent'] = value.strip()
        elif key in ('id', 'asr', 'domain'):
            values[key] = value

    columns = [values['date'], values['time'], values['id'],
               values['asr'], values['intent'], values['domain']]
    return CTRL_A.join(columns) + "\n"


def speechHandle(inputFile, outputFile):
    """Convert the records of ``inputFile`` and append them to ``outputFile``.

    Blank lines are skipped. Lines that do not have exactly six CTRL_A
    separated fields are printed to stdout and not written to the output.

    Args:
        inputFile: Path of the log file to read.
        outputFile: Path of the file the converted lines are appended to.

    Raises:
        SystemExit: With status -1 when a file cannot be opened, read or
            written (IOError).
        ValueError: If a ``time`` value is not an integer.
    """
    print("********** speechHandle " + inputFile + " start **********")
    try:
        # Context managers close both files on every exit path, including
        # the case where one of the open() calls itself fails.
        with open(inputFile, 'r') as source:
            with open(outputFile, 'a+') as sink:
                for line in source:
                    if not line.strip():
                        # A blank line is not the end of the file; keep going.
                        continue
                    formatted = _formatRecord(line)
                    if formatted is None:
                        print(line.rstrip('\r\n'))
                    else:
                        sink.write(formatted)
    except IOError as ioerr:
        print('File Error' + str(ioerr))
        sys.exit(-1)
    print("********** speechHandle " + inputFile + " end **********")


if __name__ == '__main__':
    if len(sys.argv) != 3:
        print("Please input inputFile and outputFile")
    else:
        speechHandle(sys.argv[1], sys.argv[2])
供参考
本文介绍了一个用于处理特定格式日志文件的Python脚本。该脚本读取输入文件,解析其中的日志条目并将其转换为指定的输出格式,最后将结果写入输出文件。处理过程包括提取日期、时间、序列号、语音识别结果、意图及领域等关键字段。
729

被折叠的 条评论
为什么被折叠?



