Python 3.5 CSV 特殊字符解析

import fileinput

# Rewrite "file" in place: turn every ':' into ',' and replace the literal
# text "case" with a single space.
#
# With inplace enabled, fileinput redirects standard output into the file
# being read, so each (modified) line has to be printed back. Without the
# print call the file would end up empty.
for line in fileinput.FileInput("file", inplace=True):
    line = line.replace(":", ",")
    line = line.replace("case", " ")
    # The line still carries its own newline, so suppress the one print adds.
    print(line, end="")

l h, l min, ls, gmt h, gmt m, gmt s, date, product id, manuf id, case, pallet, id, code, company id, location, secondary code
03,30,30,08,30,30,15 August 2015, 123456789, 987654321, 12, 1234, 12, 1234, 12345, 123, 12

#!/usr/bin/env python
import csv
import os

inputFileName = 'test.txt'
outputFileName = 'finished.csv'


def parse_record(line):
    """Turn one raw input line into a list of CSV field values.

    The line is split on whitespace into 14 tokens, e.g.

        03:30:30 08:30:30 [15 August 2015] productid:123456789
        manuf:987654321 case:12 pallet:1234 id:12 code:1234 12345 123 12

    Returns a 12-item list: the two time tokens, the date with its square
    brackets removed, the value part of the six 'label:value' tokens, and
    the three trailing bare values.

    Raises IndexError if the line has fewer than 14 tokens or one of the
    labelled tokens has no ':'.
    """
    tokens = line.split()
    # Tokens 2..4 are '[15', 'August', '2015]'; glue them back together.
    date = ' '.join(token.strip('[]') for token in tokens[2:5])
    # Tokens 5..10 are productid, manuf, case, pallet, id and code.
    labelled = [token.split(':')[1] for token in tokens[5:11]]
    return [tokens[0], tokens[1], date] + labelled + [tokens[11], tokens[12], tokens[13]]


def main():
    """Convert every non-blank line of inputFileName into a row of outputFileName."""
    # newline='' leaves line-ending handling to the csv module.
    with open(inputFileName, newline='') as inFile, \
            open(outputFileName, 'w', newline='') as outfile:
        w = csv.writer(outfile)
        for line in inFile:
            if not line.strip():
                continue  # nothing to parse on a blank line
            # Parse the line just read rather than a fixed sample string.
            w.writerow(parse_record(line))


if __name__ == '__main__':
    main()

2条回答

网友

1楼 · 编辑于 2024-06-12 16:30:21

使用以下方法处理每一行

# One sample input line. Splitting on whitespace yields 14 tokens:
#   0-1    the two time stamps
#   2-4    the bracketed date: '[15', 'August', '2015]'
#   5-10   'label:value' pairs: productid, manuf, case, pallet, id, code
#   11-13  three bare trailing values
line = '03:30:30 08:30:30 [15 August 2015] productid:123456789 manuf:987654321 case:12 pallet:1234 id:12 code:1234 12345 123 12'
str_list = line.split()

new_list = [str_list[0],
            str_list[1],
            ' '.join([item.strip('[]') for item in str_list[2:5]]), # '[15', 'August', '2015]'
            str_list[5].split(':')[1],   # productid (index 5, not 6)
            str_list[6].split(':')[1],   # manuf
            str_list[7].split(':')[1],   # case
            str_list[8].split(':')[1],   # pallet
            str_list[9].split(':')[1],   # id
            str_list[10].split(':')[1],  # code
            str_list[11],                # first trailing value (was skipped before)
            str_list[12],
            str_list[13]
            ]

print(new_list)
# Output
# ['03:30:30', '08:30:30', '15 August 2015', '123456789', '987654321', '12', '1234', '12', '1234', '12345', '123', '12']

写入csv文件时使用

writer.writerow(new_list)

或者先处理所有行，把结果保存到一个由列表组成的列表中，然后使用 writerows 将结果一次性写入 csv 文件

# Neither name is defined in this fragment: `writer` is presumably a
# csv.writer and `lists` a list of rows, each row a list of field values.
writer.writerows(lists)

完整的源代码

#!/usr/bin/env python
import csv

inputFileName = 'test.txt'
outputFileName = 'finished.csv'


def parse_line(line):
    """Convert one raw input line into the 12 values of a CSV row.

    After splitting on whitespace the line is expected to hold 14 tokens:
    two time stamps, a bracketed three-token date, six 'label:value' tokens
    and three bare trailing values.

    Raises IndexError if tokens are missing or a labelled token has no ':'.
    """
    str_list = line.rstrip().split()
    return [str_list[0],
            str_list[1],
            ' '.join([item.strip('[]') for item in str_list[2:5]]),  # '[15', 'August', '2015]'
            str_list[5].split(':')[1],   # product id
            str_list[6].split(':')[1],   # manuf id
            str_list[7].split(':')[1],   # case
            str_list[8].split(':')[1],   # pallet
            str_list[9].split(':')[1],   # id
            str_list[10].split(':')[1],  # code
            str_list[11],                # company id
            str_list[12],                # location
            str_list[13]]                # secondary code


def main():
    """Write a header plus one parsed row per non-blank input line."""
    # newline='' leaves line-ending handling to the csv module.
    with open(outputFileName, 'w', newline='') as outfile:
        w = csv.writer(outfile)

        # write the file header
        fieldnames = ['local time', 'GMT time', 'date', 'product id', 'manuf id',
                      'case', 'pallet', 'id', 'code', 'company id', 'location',
                      'secondary code']
        w.writerow(fieldnames)

        # process each line
        with open(inputFileName, 'r') as inFile:
            for line in inFile:
                if not line.strip():
                    continue  # a blank line has no tokens to index
                w.writerow(parse_line(line))  # write to the file


if __name__ == '__main__':
    main()

网友

2楼 · 编辑于 2024-06-12 16:30:21

如果输入文件的结构已知，就不需要使用正则表达式，因为正则表达式速度较慢。对于您的情况，可以尝试类似下面的代码：

import csv

# Turn one whitespace-separated record into a CSV row by editing its token
# list in place, then write that row to destination.csv.
with open('destination.csv', 'w', newline='') as csvfile:
    csv_writer = csv.writer(csvfile, delimiter=',')
    ...  # get your data here, the next code is for one line of data
    values = line.split()

    # Rebuild the date from its three tokens, dropping the leading '[' of
    # the first and the trailing ']' of the last.
    day, month, year = values[2][1:], values[3], values[4][:-1]
    values[2] = ' '.join((day, month, year))

    # Tokens 5..10 are 'label:value' pairs; keep only the value part.
    for position in range(5, 11):
        label_and_value = values[position].split(':')
        values[position] = label_and_value[1]

    # Month and year now live inside values[2]; drop the two stand-alone tokens.
    del values[3:5]

    csv_writer.writerow(values)

您只需修改需要处理的字段，然后将整行写入 csv。

相关问题更多 >

编程相关推荐

热门问题

热门文章