diff --git a/tap_spreadsheets_anywhere/format_handler.py b/tap_spreadsheets_anywhere/format_handler.py index 3bf911f..bc29a39 100644 --- a/tap_spreadsheets_anywhere/format_handler.py +++ b/tap_spreadsheets_anywhere/format_handler.py @@ -157,7 +157,9 @@ def get_row_iterator(table_spec, uri): reader = get_streamreader(uri, universal_newlines=universal_newlines, open_mode='r', encoding=encoding) iterator = tap_spreadsheets_anywhere.csv_handler.get_row_iterator(table_spec, reader) elif format == 'excel': - reader = get_streamreader(uri, universal_newlines=universal_newlines,newline=None, open_mode='rb') + reader = get_streamreader(uri, universal_newlines=universal_newlines,newline=None, open_mode='rb', + # encoding must be None to prevent smart_open from ignoring binary mode + encoding=None) if uri.lower().endswith(".xls"): iterator = tap_spreadsheets_anywhere.excel_handler.get_legacy_row_iterator(table_spec, reader) else: