summaryrefslogtreecommitdiff
path: root/dedup
diff options
context:
space:
mode:
authorHelmut Grohne <helmut@subdivi.de>2016-04-28 20:50:12 +0200
committerHelmut Grohne <helmut@subdivi.de>2016-04-28 20:50:12 +0200
commit9ad30297a535a8a8f9bdc945288b02d75a379cb6 (patch)
treeadacaf54f0e8bce018c89677610fa76f8caeeee5 /dedup
parenta24b9125ae91cb26e56bac3752b6e38e1dbf264e (diff)
downloaddebian-dedup-9ad30297a535a8a8f9bdc945288b02d75a379cb6.tar.gz
decouple a function decompress out of decompress_tar
Building on the previous commit, add a decompress function that turns a compressed filelike into a decompressed filelike. Use it to decouple the decompression step.
Diffstat (limited to 'dedup')
-rw-r--r--dedup/compression.py32
1 files changed, 32 insertions, 0 deletions
diff --git a/dedup/compression.py b/dedup/compression.py
index 52917e3..5df6613 100644
--- a/dedup/compression.py
+++ b/dedup/compression.py
@@ -1,7 +1,10 @@
+import bz2
import struct
import sys
import zlib
+import lzma
+
crc32_type = "L" if sys.version_info.major >= 3 else "l"
class GzipDecompressor(object):
@@ -151,3 +154,32 @@ class DecompressedStream(object):
self.decompressor = None
self.buff = b""
self.closed = True
+
+decompressors = {
+ '.gz': GzipDecompressor,
+ '.bz2': bz2.BZ2Decompressor,
+ '.lzma': lzma.LZMADecompressor,
+ '.xz': lzma.LZMADecompressor,
+}
+
+def decompress(filelike, extension):
+ """Decompress a stream according to its extension.
+ @param filelike: is a read-only byte-stream. It must support read(size) and
+ close().
+ @param extension: permitted values are "", ".gz", ".bz2", ".lzma", and
+ ".xz"
+ @type extension: str
+ @returns: a read-only byte-stream with the decompressed contents of the
+ original filelike. It supports read(size) and close(). If the
+ original supports seek(pos) and tell(), then it also supports
+ those.
+ @raises ValueError: on unknown extensions
+ """
+ if not extension:
+ return filelike
+ try:
+ decompressor = decompressors[extension]
+ except KeyError:
+ raise ValueError("unknown compression format with extension %r" %
+ extension)
+ return DecompressedStream(filelike, decompressor())