1
0
mirror of https://github.com/mikf/gallery-dl.git synced 2024-11-25 04:02:32 +01:00

[postprocessor:zip] add 'mode' option (#355)

This commit is contained in:
Mike Fährmann 2019-07-28 18:13:18 +02:00
parent 6ce22f606b
commit a90280f4e7
No known key found for this signature in database
GPG Key ID: 5680CA389D365A88
2 changed files with 43 additions and 11 deletions

View File

@ -1465,6 +1465,22 @@ Default ``false``
Description Keep the actual files after writing them to a ZIP archive.
=========== =====
zip.mode
--------
=========== =====
Type ``string``
Default ``"default"``
Description * ``"default"``: Write the central directory file header
once, after everything is done or when an exception is raised.
* ``"safe"``: Update the central directory file header
each time a file is stored in a ZIP archive.
This greatly reduces the chance of a ZIP archive getting corrupted if
the Python interpreter is shut down unexpectedly
(power outage, SIGKILL), but it is also a lot slower.
=========== =====
Miscellaneous Options

View File

@ -1,6 +1,6 @@
# -*- coding: utf-8 -*-
# Copyright 2018 Mike Fährmann
# Copyright 2018-2019 Mike Fährmann
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
@ -25,7 +25,7 @@ class ZipPP(PostProcessor):
def __init__(self, pathfmt, options):
PostProcessor.__init__(self)
self.delete = not options.get("keep-files", False)
self.ext = "." + options.get("extension", "zip")
ext = "." + options.get("extension", "zip")
algorithm = options.get("compression", "store")
if algorithm not in self.COMPRESSION_ALGORITHMS:
self.log.warning(
@ -34,29 +34,45 @@ class ZipPP(PostProcessor):
algorithm = "store"
self.path = pathfmt.realdirectory
self.zfile = zipfile.ZipFile(
self.path + self.ext, "a",
self.COMPRESSION_ALGORITHMS[algorithm], True)
args = (self.path + ext, "a",
self.COMPRESSION_ALGORITHMS[algorithm], True)
def run(self, pathfmt):
if options.get("mode") == "safe":
self.run = self._write_safe
self.zfile = None
self.args = args
else:
self.run = self._write
self.zfile = zipfile.ZipFile(*args)
def _write(self, pathfmt, zfile=None):
# 'NameToInfo' is not officially documented, but it's available
# for all supported Python versions and using it directly is a lot
# better than calling getinfo()
if pathfmt.filename not in self.zfile.NameToInfo:
self.zfile.write(pathfmt.temppath, pathfmt.filename)
# faster than calling getinfo()
if zfile is None:
zfile = self.zfile
if pathfmt.filename not in zfile.NameToInfo:
zfile.write(pathfmt.temppath, pathfmt.filename)
pathfmt.delete = self.delete
# Writer used when the "mode" option is "safe": instead of keeping one
# archive open, open it from the stored constructor arguments (self.args),
# store the single file described by 'pathfmt', and close it again.
def _write_safe(self, pathfmt):
# the 'with' block closes the archive as soon as this one file is handled
with zipfile.ZipFile(*self.args) as zfile:
# reuse the regular writer, passing the freshly opened archive explicitly
self._write(pathfmt, zfile)
def finalize(self):
self.zfile.close()
if self.zfile:
self.zfile.close()
if self.delete:
try:
# remove target directory
os.rmdir(self.path)
except OSError:
pass
if not self.zfile.NameToInfo:
if self.zfile and not self.zfile.NameToInfo:
try:
# delete empty zip archive
os.unlink(self.zfile.filename)
except OSError:
pass