62 lines
1.5 KiB
Python
62 lines
1.5 KiB
Python
|
import io
|
||
|
|
||
|
import pytest
|
||
|
|
||
|
import pandas as pd
|
||
|
import pandas._testing as tm
|
||
|
|
||
|
from pandas.io.excel import ExcelFile
|
||
|
from pandas.io.excel._base import inspect_excel_format
|
||
|
|
||
|
xlrd = pytest.importorskip("xlrd")
|
||
|
|
||
|
exts = [".xls"]
|
||
|
|
||
|
|
||
|
@pytest.fixture(params=exts)
|
||
|
def read_ext_xlrd(request):
|
||
|
"""
|
||
|
Valid extensions for reading Excel files with xlrd.
|
||
|
|
||
|
Similar to read_ext, but excludes .ods, .xlsb, and for xlrd>2 .xlsx, .xlsm
|
||
|
"""
|
||
|
return request.param
|
||
|
|
||
|
|
||
|
def test_read_xlrd_book(read_ext_xlrd, datapath):
|
||
|
engine = "xlrd"
|
||
|
sheet_name = "Sheet1"
|
||
|
pth = datapath("io", "data", "excel", "test1.xls")
|
||
|
with xlrd.open_workbook(pth) as book:
|
||
|
with ExcelFile(book, engine=engine) as xl:
|
||
|
result = pd.read_excel(xl, sheet_name=sheet_name, index_col=0)
|
||
|
|
||
|
expected = pd.read_excel(
|
||
|
book, sheet_name=sheet_name, engine=engine, index_col=0
|
||
|
)
|
||
|
tm.assert_frame_equal(result, expected)
|
||
|
|
||
|
|
||
|
def test_read_xlsx_fails(datapath):
|
||
|
# GH 29375
|
||
|
from xlrd.biffh import XLRDError
|
||
|
|
||
|
path = datapath("io", "data", "excel", "test1.xlsx")
|
||
|
with pytest.raises(XLRDError, match="Excel xlsx file; not supported"):
|
||
|
pd.read_excel(path, engine="xlrd")
|
||
|
|
||
|
|
||
|
@pytest.mark.parametrize(
|
||
|
"file_header",
|
||
|
[
|
||
|
b"\x09\x00\x04\x00\x07\x00\x10\x00",
|
||
|
b"\x09\x02\x06\x00\x00\x00\x10\x00",
|
||
|
b"\x09\x04\x06\x00\x00\x00\x10\x00",
|
||
|
b"\xd0\xcf\x11\xe0\xa1\xb1\x1a\xe1",
|
||
|
],
|
||
|
)
|
||
|
def test_read_old_xls_files(file_header):
|
||
|
# GH 41226
|
||
|
f = io.BytesIO(file_header)
|
||
|
assert inspect_excel_format(f) == "xls"
|