78 lines
1.9 KiB
Python
78 lines
1.9 KiB
Python
|
"""
|
||
|
Patched ``BZ2File`` and ``LZMAFile`` to handle pickle protocol 5.
|
||
|
"""
|
||
|
|
||
|
from __future__ import annotations
|
||
|
|
||
|
from pickle import PickleBuffer
|
||
|
|
||
|
from pandas.compat._constants import PY310
|
||
|
|
||
|
# `bz2` may fail to import on some interpreters; `has_bz2` records whether the
# import succeeded so the `BZ2File` subclass below is only defined when the
# module is actually available.
try:
    import bz2

    has_bz2 = True
except ImportError:
    has_bz2 = False
|
||
|
|
||
|
# `lzma` may fail to import on some interpreters; `has_lzma` records whether
# the import succeeded so the `LZMAFile` subclass below is only defined when
# the module is actually available.
try:
    import lzma

    has_lzma = True
except ImportError:
    has_lzma = False
|
||
|
|
||
|
|
||
|
def flatten_buffer(
    b: bytes | bytearray | memoryview | PickleBuffer,
) -> bytes | bytearray | memoryview:
    """
    Return some 1-D `uint8` typed buffer.

    Coerces anything that does not match that description to one that does
    without copying if possible (otherwise will copy).

    Parameters
    ----------
    b : bytes, bytearray, memoryview or PickleBuffer
        The buffer to flatten. Anything that is not ``bytes``, ``bytearray``
        or ``PickleBuffer`` is wrapped in a ``PickleBuffer`` first.

    Returns
    -------
    bytes, bytearray or memoryview
        ``b`` itself when it is already ``bytes`` or ``bytearray``; otherwise
        the ``memoryview`` produced by ``PickleBuffer.raw()``, or a ``bytes``
        copy when ``raw()`` raises ``BufferError``.
    """
    # `bytes` and `bytearray` already satisfy the contract; hand them back
    # untouched so no copy is made.
    if isinstance(b, (bytes, bytearray)):
        return b

    # Wrap everything else so that `raw()` is available below.
    if not isinstance(b, PickleBuffer):
        b = PickleBuffer(b)

    try:
        # coerce to 1-D `uint8` C-contiguous `memoryview` zero-copy
        return b.raw()
    except BufferError:
        # perform in-memory copy if buffer is not contiguous
        return memoryview(b).tobytes("A")
|
||
|
|
||
|
|
||
|
if has_bz2:

    class BZ2File(bz2.BZ2File):
        """
        ``bz2.BZ2File`` subclass that flattens buffers before writing.

        ``write`` is only overridden when ``PY310`` is false; otherwise the
        class inherits ``bz2.BZ2File.write`` unchanged.
        """

        if not PY310:

            def write(self, b) -> int:
                """
                Write ``b`` after passing it through ``flatten_buffer``.

                Returns whatever ``bz2.BZ2File.write`` returns.
                """
                # Workaround issue where `bz2.BZ2File` expects `len`
                # to return the number of bytes in `b` by converting
                # `b` into something that meets that constraint with
                # minimal copying.
                #
                # Note: This is fixed in Python 3.10.
                return super().write(flatten_buffer(b))
|
||
|
|
||
|
|
||
|
if has_lzma:

    class LZMAFile(lzma.LZMAFile):
        """
        ``lzma.LZMAFile`` subclass that flattens buffers before writing.

        ``write`` is only overridden when ``PY310`` is false; otherwise the
        class inherits ``lzma.LZMAFile.write`` unchanged.
        """

        if not PY310:

            def write(self, b) -> int:
                """
                Write ``b`` after passing it through ``flatten_buffer``.

                Returns whatever ``lzma.LZMAFile.write`` returns.
                """
                # Workaround issue where `lzma.LZMAFile` expects `len`
                # to return the number of bytes in `b` by converting
                # `b` into something that meets that constraint with
                # minimal copying.
                #
                # Note: This is fixed in Python 3.10.
                return super().write(flatten_buffer(b))
|