python xlsxwriter:添加 table 时将 header 保留在 excel 中

python xlsxwriter: Keep header in excel when adding a table

我有一个已写入 xlsx 文件的 pandas 数据框(DataFrame),我想在这些数据上添加一个 table。同时我想保留已经写入的 headers,而不是再添加一遍。这可能吗?

示例:

import pandas as pd
import xlsxwriter as xw

# Example frame. The two Series have different indexes, so pandas aligns
# them on the union of the labels when building the DataFrame.
d = {
    'one': pd.Series([1., 2., 3.], index=['a', 'b', 'c']),
    'two': pd.Series([5., 6., 7., 8.], index=['a', 'b', 'c', 'd']),
}
df = pd.DataFrame(d)

# The table covers the header row plus one row per record, and the index
# column plus one column per DataFrame column. Rows/columns are zero-based,
# so the last row is len(df.index) and the last column is len(df.columns).
# This must be computed before the index is turned into a regular column.
end_row = len(df.index)
end_column = len(df.columns)
cell_range = xw.utility.xl_range(0, 0, end_row, end_column)

# Use the writer as a context manager so the workbook is always closed
# (and therefore written to disk). ExcelWriter.save() no longer exists in
# current pandas releases.
with pd.ExcelWriter("test.xlsx", engine='xlsxwriter') as writer:
    # Write the same data (index included) to three sheets for comparison.
    df.to_excel(writer, sheet_name="sheet without table")
    df.to_excel(writer, sheet_name="sheet with table")
    df.to_excel(writer, sheet_name="sheet with table and header")

    # Fetch the xlsxwriter worksheets so tables can be added to them.
    worksheet_table = writer.sheets['sheet with table']
    worksheet_table_header = writer.sheets['sheet with table and header']

    # Without a 'columns' option add_table() writes its own default header
    # captions, replacing the headers pandas already wrote.
    worksheet_table.add_table(
        cell_range, {'header_row': True, 'first_column': True})

    ######################################
    # The hack
    #
    # Move the index into a regular column so that df.columns lists every
    # column present in the sheet, then hand those names to add_table() so
    # the table header shows the DataFrame's column names.
    df = df.reset_index()
    header = [{'header': name} for name in df.columns.tolist()]
    worksheet_table_header.add_table(
        cell_range,
        {'header_row': True, 'first_column': True, 'columns': header})

I would also like to keep the headers that I have already written, instead of adding them again. Is that possible?

不可以。

您在 worksheet_table_header 中的第三个解决方案可能是实现它的最佳方式。

只能使用这种 hack/变通方法(正如 @jmcnamara 所说)。简而言之就是:

import pandas as pd
import xlsxwriter as xw

# Example frame. The two Series have different indexes, so pandas aligns
# them on the union of the labels when building the DataFrame.
d = {
    'one': pd.Series([1., 2., 3.], index=['a', 'b', 'c']),
    'two': pd.Series([5., 6., 7., 8.], index=['a', 'b', 'c', 'd']),
}
df = pd.DataFrame(d)

# The table covers the header row plus one row per record, and the index
# column plus one column per DataFrame column (zero-based, inclusive).
# This must be computed before the index is turned into a regular column.
end_row = len(df.index)
end_column = len(df.columns)
cell_range = xw.utility.xl_range(0, 0, end_row, end_column)

# Use the writer as a context manager so the workbook is always closed
# (and therefore written to disk). ExcelWriter.save() no longer exists in
# current pandas releases.
with pd.ExcelWriter("test.xlsx", engine='xlsxwriter') as writer:
    # Write the data, index included.
    df.to_excel(writer, sheet_name="sheet with table and header")

    # Fetch the xlsxwriter worksheet so the table can be added to it.
    worksheet_table_header = writer.sheets['sheet with table and header']

    ######################################
    # The hack
    #
    # Move the index into a regular column so that df.columns lists every
    # column present in the sheet, then hand those names to add_table() so
    # the table header shows the DataFrame's column names.
    df = df.reset_index()
    header = [{'header': name} for name in df.columns.tolist()]
    worksheet_table_header.add_table(
        cell_range,
        {'header_row': True, 'first_column': True, 'columns': header})

在使用 xlsxwriter 0.9.6 版本时,我不得不修改 @jmcnamara 的 hack:必须把列数减去 1,否则表格会多出一个 pandas.DataFrame 中并不存在的列(请参阅 end_column 的赋值)。这是因为下面的代码以 index=False 写入,工作表中没有索引列。以下是修改后的版本(pandas 0.19.2)。

import pandas as pd
import xlsxwriter

# Example frame built from two Series of different length.
d = {'one': pd.Series([1., 2., 3.]), 'two': pd.Series([5., 6., 7., 8.])}
df = pd.DataFrame(d)
# print() as a function call works on both Python 2 and Python 3.
print(df)

# The sheet is written without the index, so the table spans the header row
# plus len(df.index) data rows, and columns 0 .. len(df.columns) - 1.
end_row = len(df.index)
end_column = len(df.columns) - 1
cell_range = xlsxwriter.utility.xl_range(0, 0, end_row, end_column)

# Use the writer as a context manager so the workbook is closed (and written
# to disk) exactly once. ExcelWriter.save() no longer exists in current
# pandas releases.
with pd.ExcelWriter("test.xlsx", engine='xlsxwriter') as writer:
    df.to_excel(writer, sheet_name='sheet1', index=False)

    # Fetch the xlsxwriter worksheet so the table can be added to it.
    ws = writer.sheets['sheet1']

    ######################################
    # The hack
    #
    # Pass the DataFrame's column names as the table's header captions so
    # add_table() does not replace them with its default captions.
    header = [{'header': c} for c in df.columns.tolist()]
    ws.add_table(
        cell_range,
        {'header_row': True, 'columns': header,
         'style': 'Table Style Medium 11'})
    # Keep the header row and the first column visible while scrolling.
    ws.freeze_panes(1, 1)

这个怎么样(请注意,仅当数据框包含 NA 时才需要 'options'):

import pandas as pd
import xlsxwriter

# Example frame built from two Series of different length.
d = {
    'one': pd.Series([1., 2., 3.]),
    'two': pd.Series([5., 6., 7., 8.]),
}
df = pd.DataFrame(d)

# Table geometry: row 0 holds the header, followed by one row per record;
# columns are zero-based, hence the "- 1" on the column count.
row_count, column_count = df.shape
last_row = row_count
last_column = column_count - 1

# Table definition: the cell values, one header caption per DataFrame
# column, and the table style.
table_options = {
    'data': df.values.tolist(),
    'columns': [{'header': caption} for caption in df.columns.tolist()],
    'style': 'Table Style Medium 9',
}

# 'nan_inf_to_errors' is passed so that NaN values in the data can be written.
workbook = xlsxwriter.Workbook('test.xlsx', options={'nan_inf_to_errors': True})
worksheet = workbook.add_worksheet('sheet1')
worksheet.add_table(0, 0, last_row, last_column, table_options)
workbook.close()