我正在尝试重命名 CSV 文件中带有空格的列标题。按照 Pandas API 参考使用下面这几行代码不起作用:标题中仍然是空格,而不是下划线。
import pandas as pd
# Load the CSV, then normalise every column label in three vectorised
# steps: strip surrounding whitespace, lower-case, spaces -> underscores.
df = pd.read_csv("my.csv", low_memory=False)
trimmed = df.columns.str.strip()
lowered = trimmed.str.lower()
df.columns = lowered.str.replace(' ', '_')
尝试使用列表推导式。
# Plain-Python normalisation of the column labels: strip each label,
# lower-case it, then replace every space with an underscore.
df.columns = [
    label.strip().lower().replace(' ', '_')
    for label in df.columns
]
尝试使用 `rename` 方法?
# DataFrame.rename returns a new frame by default instead of modifying df
# in place, so the result must be bound back to df for the new labels to
# stick. The keys have to match the existing headers exactly, including
# the trailing space in "B space ".
df = df.rename(index=str, columns={"A space": "a", "B space ": "c"})
我放弃了 Pandas,改用 Python 2.7 中的 csv 模块。
import csv
import re
import tempfile
import sys
import os
# Bind `replace` to a rename function suited to the running interpreter
# and platform:
#   * Python 3.3+     -> os.replace
#   * older, Windows  -> the third-party `osreplace` backport
#   * older, other OS -> os.rename
# NOTE(review): presumably chosen because os.rename refuses to overwrite an
# existing destination on Windows - confirm against the os documentation.
if sys.version_info >= (3, 3):
    from os import replace
elif sys.platform == "win32":
    from osreplace import replace
else:
    from os import rename as replace
# Rewrite the header row of the tab-delimited 'myFile.txt' so that every
# run of whitespace inside a column name becomes a single underscore, save
# the result as 'newFile.txt', then convert that file to the
# comma-separated 'myFile.csv'.
#
# NOTE: the 'rb'/'wb' modes follow the Python 2.7 csv convention. On
# Python 3 the csv module expects text-mode files opened with newline=''.
with tempfile.NamedTemporaryFile(dir='.', delete=False) as tmp, \
        open('myFile.txt', 'rb') as f:
    r = csv.reader(f, delimiter='\t')
    w = csv.writer(tmp, delimiter='\t', quoting=csv.QUOTE_NONNUMERIC)
    header = next(r)
    # Strip each header cell, then collapse inner whitespace runs to "_".
    newHeaderList = [re.sub(r"\s+", "_", h.strip()) for h in header]
    w.writerow(newHeaderList)
    # The remaining rows are written with their values unchanged.
    w.writerows(r)

# Move the temp file into place only after the with-block has closed (and
# therefore flushed) it. The original call passed the undefined name
# `new_text_filepath`; the next step reads 'newFile.txt', so that is the
# destination. `replace` is the rename function selected at import time.
replace(tmp.name, 'newFile.txt')

# Re-read the cleaned tab-delimited file and emit it with the csv module's
# default dialect. The with-statement guarantees both files are closed, so
# the output is fully flushed to disk.
with open('newFile.txt', 'rb') as src, open('myFile.csv', 'wb') as dst:
    new_txt = csv.reader(src, delimiter='\t')
    out_csv = csv.writer(dst)
    out_csv.writerows(new_txt)