本文整理汇总了Python中gzip.html方法的典型用法代码示例。如果您正苦于以下问题:Python gzip.html方法的具体用法?Python gzip.html怎么用?Python gzip.html使用的例子?那么, 这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类gzip
的用法示例。
在下文中一共展示了gzip.html方法的7个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: make_tarfile
# 需要导入模块: import gzip [as 别名]
# 或者: from gzip import html [as 别名]
def make_tarfile(output_filename, source_dir, archive_name, custom_filter=None):
# Helper for filtering out modification timestamps
def _filter_timestamps(tar_info):
tar_info.mtime = 0
return tar_info if custom_filter is None else custom_filter(tar_info)
unzipped_filename = tempfile.mktemp()
try:
with tarfile.open(unzipped_filename, "w") as tar:
tar.add(source_dir, arcname=archive_name, filter=_filter_timestamps)
# When gzipping the tar, don't include the tar's filename or modification time in the
# zipped archive (see https://docs.python.org/3/library/gzip.html#gzip.GzipFile)
with gzip.GzipFile(filename="", fileobj=open(output_filename, 'wb'), mode='wb', mtime=0) \
as gzipped_tar, open(unzipped_filename, 'rb') as tar:
gzipped_tar.write(tar.read())
finally:
os.remove(unzipped_filename)
示例2: compress
# 需要导入模块: import gzip [as 别名]
# 或者: from gzip import html [as 别名]
def compress(body, compress_level):
"""Compress 'body' at the given compress_level."""
import zlib
# See http://www.gzip.org/zlib/rfc-gzip.html
yield b'\x1f\x8b' # ID1 and ID2: gzip marker
yield b'\x08' # CM: compression method
yield b'\x00' # FLG: none set
# MTIME: 4 bytes
yield struct.pack('<L', int(time.time()) & int('FFFFFFFF', 16))
yield b'\x02' # XFL: max compression, slowest algo
yield b'\xff' # OS: unknown
crc = zlib.crc32(b'')
size = 0
zobj = zlib.compressobj(compress_level,
zlib.DEFLATED, -zlib.MAX_WBITS,
zlib.DEF_MEM_LEVEL, 0)
for line in body:
size += len(line)
crc = zlib.crc32(line, crc)
yield zobj.compress(line)
yield zobj.flush()
# CRC32: 4 bytes
yield struct.pack('<L', crc & int('FFFFFFFF', 16))
# ISIZE: 4 bytes
yield struct.pack('<L', size & int('FFFFFFFF', 16))
示例3: compress
# 需要导入模块: import gzip [as 别名]
# 或者: from gzip import html [as 别名]
def compress(body, compress_level):
"""Compress 'body' at the given compress_level."""
import zlib
# See http://www.gzip.org/zlib/rfc-gzip.html
yield ntob('\x1f\x8b') # ID1 and ID2: gzip marker
yield ntob('\x08') # CM: compression method
yield ntob('\x00') # FLG: none set
# MTIME: 4 bytes
yield struct.pack("<L", int(time.time()) & int('FFFFFFFF', 16))
yield ntob('\x02') # XFL: max compression, slowest algo
yield ntob('\xff') # OS: unknown
crc = zlib.crc32(ntob(""))
size = 0
zobj = zlib.compressobj(compress_level,
zlib.DEFLATED, -zlib.MAX_WBITS,
zlib.DEF_MEM_LEVEL, 0)
for line in body:
size += len(line)
crc = zlib.crc32(line, crc)
yield zobj.compress(line)
yield zobj.flush()
# CRC32: 4 bytes
yield struct.pack("<L", crc & int('FFFFFFFF', 16))
# ISIZE: 4 bytes
yield struct.pack("<L", size & int('FFFFFFFF', 16))
示例4: compress
# 需要导入模块: import gzip [as 别名]
# 或者: from gzip import html [as 别名]
def compress(body, compress_level):
"""Compress 'body' at the given compress_level."""
import zlib
# See http://www.gzip.org/zlib/rfc-gzip.html
yield ntob('\x1f\x8b') # ID1 and ID2: gzip marker
yield ntob('\x08') # CM: compression method
yield ntob('\x00') # FLG: none set
# MTIME: 4 bytes
yield struct.pack('<L', int(time.time()) & int('FFFFFFFF', 16))
yield ntob('\x02') # XFL: max compression, slowest algo
yield ntob('\xff') # OS: unknown
crc = zlib.crc32(ntob(''))
size = 0
zobj = zlib.compressobj(compress_level,
zlib.DEFLATED, -zlib.MAX_WBITS,
zlib.DEF_MEM_LEVEL, 0)
for line in body:
size += len(line)
crc = zlib.crc32(line, crc)
yield zobj.compress(line)
yield zobj.flush()
# CRC32: 4 bytes
yield struct.pack('<L', crc & int('FFFFFFFF', 16))
# ISIZE: 4 bytes
yield struct.pack('<L', size & int('FFFFFFFF', 16))
示例5: compress
# 需要导入模块: import gzip [as 别名]
# 或者: from gzip import html [as 别名]
def compress(body, compress_level):
"""Compress 'body' at the given compress_level."""
import zlib
# See http://www.gzip.org/zlib/rfc-gzip.html
yield ntob('\x1f\x8b') # ID1 and ID2: gzip marker
yield ntob('\x08') # CM: compression method
yield ntob('\x00') # FLG: none set
# MTIME: 4 bytes
yield struct.pack("<L", int(time.time()) & int('FFFFFFFF', 16))
yield ntob('\x02') # XFL: max compression, slowest algo
yield ntob('\xff') # OS: unknown
crc = zlib.crc32(ntob(""))
size = 0
zobj = zlib.compressobj(compress_level,
zlib.DEFLATED, -zlib.MAX_WBITS,
zlib.DEF_MEM_LEVEL, 0)
for line in body:
size += len(line)
crc = zlib.crc32(line, crc)
yield zobj.compress(line)
yield zobj.flush()
# CRC32: 4 bytes
yield struct.pack("<L", crc & int('FFFFFFFF', 16))
# ISIZE: 4 bytes
yield struct.pack("<L", size & int('FFFFFFFF', 16))
示例6: fileobj_name
# 需要导入模块: import gzip [as 别名]
# 或者: from gzip import html [as 别名]
def fileobj_name(f):
"""
Returns the 'name' of file-like object f, if it has anything that could be
called its name. Otherwise f's class or type is returned. If f is a
string f itself is returned.
"""
if isinstance(f, str):
return f
elif isinstance(f, gzip.GzipFile):
# The .name attribute on GzipFiles does not always represent the name
# of the file being read/written--it can also represent the original
# name of the file being compressed
# See the documentation at
# https://docs.python.org/3/library/gzip.html#gzip.GzipFile
# As such, for gzip files only return the name of the underlying
# fileobj, if it exists
return fileobj_name(f.fileobj)
elif hasattr(f, 'name'):
return f.name
elif hasattr(f, 'filename'):
return f.filename
elif hasattr(f, '__class__'):
return str(f.__class__)
else:
return str(type(f))
示例7: _compute_lm
# 需要导入模块: import gzip [as 别名]
# 或者: from gzip import html [as 别名]
def _compute_lm(self, G_arpa):
"""Generate an ARPA n-gram from an abkhazia corpus
This method relies on the following Kaldi programs:
add-start-end.sh, build-lm.sh and compile-lm. It uses the
IRSTLM library.
"""
self.log.info(
'computing %s %s-gram in ARPA format', self.level, self.order)
# cut -d' ' -f2 lm_text > text_ready. Train need to
# remove utt-id on first column of text file
lm_text = os.path.join(self.a2k._local_path(), 'lm_text.txt')
lm_lines = utils.open_utf8(lm_text, 'r').readlines()
text_ready = os.path.join(self.a2k._local_path(), 'text_ready.txt')
with utils.open_utf8(text_ready, 'w') as ready:
ready.write('\n'.join(
[' '.join(line.split()[1:]) for line in lm_lines]))
text_se = os.path.join(self.a2k._local_path(), 'text_se.txt')
utils.jobs.run(
'add-start-end.sh',
stdin=open(text_ready, 'r'),
stdout=open(text_se, 'w').write,
env=kaldi_path(), cwd=self.recipe_dir)
assert os.path.isfile(text_se), 'LM failed on add-start-end'
# k option is number of split, useful for huge text files
# build-lm.sh in kaldi/tools/irstlm/bin
text_lm = os.path.join(self.a2k._local_path(), 'text_lm.gz')
self._run_command(
'build-lm.sh -i {0} -n {1} -o {2} -k 1 -s kneser-ney'
.format(text_se, self.order, text_lm))
assert os.path.isfile(text_lm), 'LM failed on build-lm'
text_blm = os.path.join(self.a2k._local_path(), 'text_blm.gz')
self._run_command(
# was with the -i option
'compile-lm {} --text=yes {}'.format(text_lm, text_blm))
# gzip the compiled lm (from
# https://docs.python.org/2/library/gzip.html#examples-of-usage)
with open(text_blm, 'rb') as fin, gzip.open(G_arpa, 'wb') as fout:
shutil.copyfileobj(fin, fout)