From 27c3a41a46d10d6436498595f7e17dc70a249ff9 Mon Sep 17 00:00:00 2001 From: Binh Nguyen Date: Tue, 5 May 2020 15:03:02 +0700 Subject: [PATCH] [REF] add DataFrame to_excel params, update requirements.txt since Pandas needs XlsxWriter>=0.9.8 --- camelot/core.py | 6 ++++-- requirements.txt | 1 + 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/camelot/core.py b/camelot/core.py index b7a02b1..6e3d73d 100644 --- a/camelot/core.py +++ b/camelot/core.py @@ -712,7 +712,7 @@ class TableList(object): filepath = os.path.join(dirname, filename) z.write(filepath, os.path.basename(filepath)) - def export(self, path, f="csv", compress=False): + def export(self, path, f="csv", compress=False, df_kwargs={}): """Exports the list of tables to specified file format. Parameters @@ -723,6 +723,8 @@ class TableList(object): File format. Can be csv, json, excel, html and sqlite. compress : bool Whether or not to add files to a ZIP archive. + df_kwargs : dict, optional (default: {}) + A dict of `pandas.DataFrame.to_excel https://github.com/pandas-dev/pandas/blob/master/pandas/core/generic.py#L1924` """ dirname = os.path.dirname(path) @@ -742,7 +744,7 @@ class TableList(object): writer = pd.ExcelWriter(filepath) for table in self._tables: sheet_name = "page-{}-table-{}".format(table.page, table.order) - table.df.to_excel(writer, sheet_name=sheet_name, encoding="utf-8") + table.df.to_excel(writer, sheet_name=sheet_name, encoding="utf-8", **df_kwargs) writer.save() if compress: zipname = os.path.join(os.path.dirname(path), root) + ".zip" diff --git a/requirements.txt b/requirements.txt index f815e26..31d2c7d 100755 --- a/requirements.txt +++ b/requirements.txt @@ -6,3 +6,4 @@ openpyxl>=2.5.8 pandas>=0.23.4 pdfminer.six>=20170720 PyPDF2>=1.26.0 +XlsxWriter>=0.9.8