summary refs log tree commit diff
path: root/dedup/compression.py
diff options
context:
space:
mode:
Diffstat (limited to 'dedup/compression.py')
-rw-r--r-- dedup/compression.py 32
1 files changed, 32 insertions, 0 deletions
diff --git a/dedup/compression.py b/dedup/compression.py
index 52917e3..5df6613 100644
--- a/dedup/compression.py
+++ b/dedup/compression.py
@@ -1,7 +1,10 @@
+import bz2
import struct
import sys
import zlib
+import lzma
+
crc32_type = "L" if sys.version_info.major >= 3 else "l"
class GzipDecompressor(object):
@@ -151,3 +154,32 @@ class DecompressedStream(object):
self.decompressor = None
self.buff = b""
self.closed = True
+
# Lookup table from a file name extension (including the leading dot) to a
# callable that is invoked without arguments to obtain a fresh decompressor
# object for that format.  Both '.lzma' and '.xz' map to the same lzma class.
decompressors = dict((
    ('.gz', GzipDecompressor),
    ('.bz2', bz2.BZ2Decompressor),
    ('.lzma', lzma.LZMADecompressor),
    ('.xz', lzma.LZMADecompressor),
))
+
def decompress(filelike, extension):
    """Wrap a byte-stream in the decompressor selected by its extension.

    An empty extension means "not compressed": the stream is handed back
    untouched. Any other extension is looked up in the module-level
    decompressors table and the stream is wrapped in a DecompressedStream
    driven by a newly created decompressor object.

    @param filelike: is a read-only byte-stream. It must support read(size)
        and close().
    @param extension: permitted values are "", ".gz", ".bz2", ".lzma", and
        ".xz"
    @type extension: str
    @returns: a read-only byte-stream with the decompressed contents of the
        original filelike. It supports read(size) and close(). If the
        original supports seek(pos) and tell(), then it also supports
        those.
    @raises ValueError: on unknown extensions
    """
    if extension:
        try:
            factory = decompressors[extension]
        except KeyError:
            raise ValueError("unknown compression format with extension %r" %
                             extension)
        else:
            # Each call gets its own decompressor instance.
            return DecompressedStream(filelike, factory())
    # Falsy extension: nothing to decompress, pass the stream through.
    return filelike