1
0
mirror of https://github.com/mikf/gallery-dl.git synced 2024-11-25 04:02:32 +01:00
gallery-dl/test/test_postprocessor.py

537 lines
17 KiB
Python
Raw Normal View History

2019-08-12 21:46:30 +02:00
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
# Copyright 2019-2022 Mike Fährmann
2019-08-12 21:46:30 +02:00
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.
import os
import sys
import unittest
from unittest.mock import Mock, mock_open, patch
import logging
2019-08-12 21:46:30 +02:00
import zipfile
import tempfile
2020-11-18 17:11:55 +01:00
import collections
from datetime import datetime
2019-08-12 21:46:30 +02:00
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
from gallery_dl import extractor, output, path # noqa E402
2020-11-18 17:11:55 +01:00
from gallery_dl import postprocessor, config # noqa E402
from gallery_dl.postprocessor.common import PostProcessor # noqa E402
2019-08-12 21:46:30 +02:00
class MockPostprocessorModule(Mock):
    """Mock object used as the return value of the patched import call."""

    # attribute carried by the fake module object
    __postprocessor__ = "mock"
class FakeJob():
    """Lightweight job object handed to postprocessors in these tests."""

    # NOTE: the default for 'extr' is evaluated once, when the class body is
    # executed, so every FakeJob() created without an argument shares it.
    def __init__(self, extr=extractor.find("test:")):
        self.extractor = extr
        self.pathfmt = path.PathFormat(extr)
        self.out = output.NullOutput()
        self.get_logger = logging.getLogger
        # event name -> list of registered callbacks
        self.hooks = collections.defaultdict(list)

    def register_hooks(self, hooks, options):
        """Append every callback in 'hooks' to the list for its event.

        'options' is accepted but not used here.
        """
        for event, func in hooks.items():
            self.hooks[event].append(func)
2019-08-12 21:46:30 +02:00
class TestPostprocessorModule(unittest.TestCase):
    """Tests for postprocessor.find() and its result cache."""

    def setUp(self):
        # every test starts with an empty lookup cache
        postprocessor._cache.clear()

    def test_find(self):
        # each listed module name resolves to a '<Name>PP' class
        # that derives directly from PostProcessor
        for name in postprocessor.modules:
            cls = postprocessor.find(name)
            expected_name = name.capitalize() + "PP"
            self.assertEqual(cls.__name__, expected_name)
            self.assertIs(cls.__base__, PostProcessor)

        # anything else yields None
        for unknown in ("foo", 1234, None):
            self.assertEqual(postprocessor.find(unknown), None)

    @patch("builtins.__import__")
    def test_cache(self, import_module):
        import_module.return_value = MockPostprocessorModule()
        module_count = len(postprocessor.modules)

        # first pass: one import call per module
        # second pass: no new calls to import_module
        for _ in range(2):
            for name in postprocessor.modules:
                postprocessor.find(name)
            self.assertEqual(import_module.call_count, module_count)
class BasePostprocessorTest(unittest.TestCase):
    """Shared fixture for the per-postprocessor test cases.

    _create() derives the postprocessor name from the subclass name by
    dropping its last four characters (the "Test" suffix) and lowercasing
    the rest.
    """

    @classmethod
    def setUpClass(cls):
        # one temporary base directory and one job per test class
        cls.dir = tempfile.TemporaryDirectory()
        config.set((), "base-directory", cls.dir.name)
        cls.job = FakeJob()

    @classmethod
    def tearDownClass(cls):
        cls.dir.cleanup()
        config.clear()

    def tearDown(self):
        # drop callbacks registered by the postprocessor of the last test
        self.job.hooks.clear()

    def _create(self, options=None, data=None):
        """Build the path for a test file and return a postprocessor.

        'data' is merged into the default keyword dict; 'options' is
        passed to the postprocessor constructor (empty dict if None).
        """
        kwdict = {"category": "test", "filename": "file", "extension": "ext"}
        if data is not None:
            kwdict.update(data)

        pathfmt = self.pathfmt = self.job.pathfmt
        pathfmt.set_directory(kwdict)
        pathfmt.set_filename(kwdict)
        pathfmt.build_path()

        pp_name = self.__class__.__name__[:-4].lower()
        pp_class = postprocessor.find(pp_name)
        return pp_class(self.job, {} if options is None else options)

    def _trigger(self, events=None, *args):
        """Call all callbacks registered for 'events' with the path object.

        Without 'events', the "prepare" and "file" hooks are run.
        """
        if not events:
            events = ("prepare", "file")
        for event in events:
            for callback in self.job.hooks[event]:
                callback(self.pathfmt, *args)
2019-08-12 21:46:30 +02:00
class ClassifyTest(BasePostprocessorTest):
    """Tests for the postprocessor looked up as "classify"."""

    def test_classify_default(self):
        pp = self._create()

        # the default mapping is the inverted DEFAULT_MAPPING
        expected_mapping = {}
        for directory, exts in pp.DEFAULT_MAPPING.items():
            for ext in exts:
                expected_mapping[ext] = directory
        self.assertEqual(pp.mapping, expected_mapping)

        pathfmt = self.pathfmt
        pathfmt.set_extension("jpg")
        pathfmt.build_path()

        pp.prepare(pathfmt)
        target_dir = os.path.join(self.dir.name, "test", "Pictures")
        expected_file = target_dir + "/file.jpg"
        self.assertEqual(pathfmt.path, expected_file)
        self.assertEqual(pathfmt.realpath, expected_file)

        with patch("os.makedirs") as mkdirs:
            self._trigger()
            mkdirs.assert_called_once_with(target_dir, exist_ok=True)

    def test_classify_noop(self):
        pp = self._create()
        pathfmt = self.pathfmt
        original = pathfmt.realpath

        # extension "ext" is not remapped here, so the paths stay unchanged
        pp.prepare(pathfmt)
        self.assertEqual(pathfmt.path, original)
        self.assertEqual(pathfmt.realpath, original)

        with patch("os.makedirs") as mkdirs:
            self._trigger()
            self.assertEqual(mkdirs.call_count, 0)

    def test_classify_custom(self):
        custom = {"foo/bar": ["foo", "bar"]}
        pp = self._create({"mapping": custom})
        self.assertEqual(pp.mapping, {
            "foo": "foo/bar",
            "bar": "foo/bar",
        })

        pathfmt = self.pathfmt
        pathfmt.set_extension("foo")
        pathfmt.build_path()

        pp.prepare(pathfmt)
        target_dir = os.path.join(self.dir.name, "test", "foo", "bar")
        expected_file = target_dir + "/file.foo"
        self.assertEqual(pathfmt.path, expected_file)
        self.assertEqual(pathfmt.realpath, expected_file)

        with patch("os.makedirs") as mkdirs:
            self._trigger()
            mkdirs.assert_called_once_with(target_dir, exist_ok=True)
class MetadataTest(BasePostprocessorTest):
    """Tests for the postprocessor looked up as "metadata".

    Output is captured by patching 'builtins.open' (or 'sys.stdout') and
    joining the arguments of all recorded write() calls, see _output().
    """

    def test_metadata_default(self):
        pp = self._create()

        # default arguments
        self.assertEqual(pp.write, pp._write_json)
        self.assertEqual(pp.ascii, False)
        self.assertEqual(pp.indent, 4)
        self.assertEqual(pp.extension, "json")

    def test_metadata_json(self):
        pp = self._create({
            "mode"     : "json",
            "ascii"    : True,
            "indent"   : 2,
            "extension": "JSON",
        }, {
            "public"   : "hello",
            "_private" : "world",
        })

        self.assertEqual(pp.write, pp._write_json)
        self.assertEqual(pp.ascii, True)
        self.assertEqual(pp.indent, 2)
        self.assertEqual(pp.extension, "JSON")

        with patch("builtins.open", mock_open()) as m:
            self._trigger()

        path = self.pathfmt.realpath + ".JSON"
        m.assert_called_once_with(path, "w", encoding="utf-8")
        # "indent": 2 -> members are indented by two spaces;
        # the "_private" key is expected to be absent from the output
        self.assertEqual(self._output(m), """{
  "category": "test",
  "extension": "ext",
  "filename": "file",
  "public": "hello"
}
""")

    def test_metadata_tags(self):
        pp = self._create(
            {"mode": "tags"},
            {"tags": ["foo", "bar", "baz"]},
        )
        self.assertEqual(pp.write, pp._write_tags)
        self.assertEqual(pp.extension, "txt")

        with patch("builtins.open", mock_open()) as m:
            self._trigger()

        path = self.pathfmt.realpath + ".txt"
        m.assert_called_once_with(path, "w", encoding="utf-8")
        self.assertEqual(self._output(m), "foo\nbar\nbaz\n")

    def test_metadata_tags_split_1(self):
        # comma-separated tag string
        self._create(
            {"mode": "tags"},
            {"tags": "foo, bar, baz"},
        )
        with patch("builtins.open", mock_open()) as m:
            self._trigger()
        self.assertEqual(self._output(m), "foo\nbar\nbaz\n")

    def test_metadata_tags_split_2(self):
        # space-separated tag string
        self._create(
            {"mode": "tags"},
            {"tags": "foobar1 foobar2 foobarbaz"},
        )
        with patch("builtins.open", mock_open()) as m:
            self._trigger()
        self.assertEqual(self._output(m), "foobar1\nfoobar2\nfoobarbaz\n")

    def test_metadata_tags_tagstring(self):
        # tags supplied under the "tag_string" key instead of "tags"
        self._create(
            {"mode": "tags"},
            {"tag_string": "foo, bar, baz"},
        )
        with patch("builtins.open", mock_open()) as m:
            self._trigger()
        self.assertEqual(self._output(m), "foo\nbar\nbaz\n")

    def test_metadata_tags_dict(self):
        # tags grouped in a dict of lists
        self._create(
            {"mode": "tags"},
            {"tags": {"g": ["foobar1", "foobar2"], "m": ["foobarbaz"]}},
        )
        with patch("builtins.open", mock_open()) as m:
            self._trigger()
        self.assertEqual(self._output(m), "foobar1\nfoobar2\nfoobarbaz\n")

    def test_metadata_custom(self):
        def test(pp_info):
            pp = self._create(pp_info, {"foo": "bar"})
            self.assertEqual(pp.write, pp._write_custom)
            self.assertEqual(pp.extension, "txt")
            self.assertTrue(pp._content_fmt)

            with patch("builtins.open", mock_open()) as m:
                self._trigger()
            self.assertEqual(self._output(m), "bar\nNone\n")
            # each call creates a new postprocessor on the shared job,
            # so previously registered callbacks must be removed
            self.job.hooks.clear()

        test({"mode": "custom", "content-format": "{foo}\n{missing}\n"})
        test({"mode": "custom", "content-format": ["{foo}", "{missing}"]})
        test({"mode": "custom", "format": "{foo}\n{missing}\n"})
        test({"format": "{foo}\n{missing}\n"})

    def test_metadata_extfmt(self):
        pp = self._create({
            "extension"       : "ignored",
            "extension-format": "json",
        })
        self.assertEqual(pp._filename, pp._filename_extfmt)

        with patch("builtins.open", mock_open()) as m:
            self._trigger()

        path = self.pathfmt.realdirectory + "file.json"
        m.assert_called_once_with(path, "w", encoding="utf-8")

    def test_metadata_extfmt_2(self):
        self._create({
            "extension-format": "{extension!u}-data:{category:Res/ES/}",
        })
        self.pathfmt.prefix = "2."

        with patch("builtins.open", mock_open()) as m:
            self._trigger()

        path = self.pathfmt.realdirectory + "file.2.EXT-data:tESt"
        m.assert_called_once_with(path, "w", encoding="utf-8")

    def test_metadata_directory(self):
        self._create({
            "directory": "metadata",
        })

        with patch("builtins.open", mock_open()) as m:
            self._trigger()

        path = self.pathfmt.realdirectory + "metadata/file.ext.json"
        m.assert_called_once_with(path, "w", encoding="utf-8")

    def test_metadata_directory_2(self):
        # trailing slashes in "directory" must not end up in the path
        self._create({
            "directory"       : "metadata////",
            "extension-format": "json",
        })

        with patch("builtins.open", mock_open()) as m:
            self._trigger()

        path = self.pathfmt.realdirectory + "metadata/file.json"
        m.assert_called_once_with(path, "w", encoding="utf-8")

    def test_metadata_filename(self):
        # "filename" takes precedence over "extension-format" here
        self._create({
            "filename"        : "{category}_{filename}_/meta/\n\r.data",
            "extension-format": "json",
        })

        with patch("builtins.open", mock_open()) as m:
            self._trigger()

        path = self.pathfmt.realdirectory + "test_file__meta_.data"
        m.assert_called_once_with(path, "w", encoding="utf-8")

    def test_metadata_stdout(self):
        self._create({"filename": "-", "indent": None})

        with patch("sys.stdout", Mock()) as m:
            self._trigger()

        self.assertEqual(self._output(m), """\
{"category": "test", "extension": "ext", "filename": "file"}
""")

    def test_metadata_modify(self):
        kwdict = {"foo": 0, "bar": {"bax": 1, "bay": 2, "baz": 3}}
        self._create({
            "mode": "modify",
            "fields": {
                "foo"     : "{filename}-{foo!s}",
                "foo2"    : "\fE bar['bax'] + 122",
                "bar[baz]": "{_now}",
                "bar[ba2]": "test",
            },
        }, kwdict)
        pdict = self.pathfmt.kwdict

        # before triggering, values equal the input but live in another dict
        self.assertIsNot(kwdict, pdict)
        self.assertEqual(pdict["foo"], kwdict["foo"])
        self.assertEqual(pdict["bar"], kwdict["bar"])

        self._trigger()

        self.assertEqual(pdict["foo"], "file-0")
        self.assertEqual(pdict["foo2"], 123)
        self.assertEqual(pdict["bar"]["ba2"], "test")
        self.assertIsInstance(pdict["bar"]["baz"], datetime)

    def test_metadata_delete(self):
        kwdict = {"foo": 0, "bar": {"bax": 1, "bay": 2, "baz": 3}}
        self._create({"mode": "delete", "fields": ["foo", "bar[baz]"]}, kwdict)
        pdict = self.pathfmt.kwdict

        self.assertIsNot(kwdict, pdict)
        self.assertEqual(pdict["foo"], kwdict["foo"])
        self.assertEqual(pdict["bar"], kwdict["bar"])

        # build the expected result by hand
        del kwdict["foo"]
        del kwdict["bar"]["baz"]

        self._trigger()
        self.assertNotIn("foo", pdict)
        self.assertNotIn("baz", pdict["bar"])
        self.assertEqual(kwdict["bar"], pdict["bar"])

        # triggering a second time must give the same result
        self._trigger()
        self.assertNotIn("foo", pdict)
        self.assertNotIn("baz", pdict["bar"])
        self.assertEqual(kwdict["bar"], pdict["bar"])

    @staticmethod
    def _output(mock):
        """Return the concatenated first arguments of all write() calls."""
        return "".join(
            call[1][0]
            for call in mock.mock_calls
            if call[0].endswith("write")
        )
class MtimeTest(BasePostprocessorTest):
    """Tests for the postprocessor looked up as "mtime"."""

    def _assert_mtime(self, options, data):
        # create the postprocessor, run the default hooks and
        # verify the timestamp stored under "_mtime"
        self._create(options, data)
        self._trigger()
        self.assertEqual(self.pathfmt.kwdict["_mtime"], 315532800)

    def test_mtime_datetime(self):
        self._assert_mtime(None, {"date": datetime(1980, 1, 1)})

    def test_mtime_timestamp(self):
        self._assert_mtime(None, {"date": 315532800})

    def test_mtime_key(self):
        self._assert_mtime({"key": "foo"}, {"foo": 315532800})

    def test_mtime_value(self):
        self._assert_mtime({"value": "{foo}"}, {"foo": 315532800})
2019-08-12 21:46:30 +02:00
class ZipTest(BasePostprocessorTest):
    """Tests for the postprocessor looked up as "zip"."""

    def test_zip_default(self):
        pp = self._create()
        self.assertEqual(self.job.hooks["file"][0], pp.write_fast)
        # archive path is the target directory without its trailing separator
        self.assertEqual(pp.path, self.pathfmt.realdirectory[:-1])
        self.assertEqual(pp.delete, True)
        self.assertEqual(pp.args, (
            pp.path + ".zip", "a", zipfile.ZIP_STORED, True,
        ))
        self.assertTrue(pp.args[0].endswith("/test.zip"))

    def test_zip_safe(self):
        pp = self._create({"mode": "safe"})
        self.assertEqual(self.job.hooks["file"][0], pp.write_safe)
        self.assertEqual(pp.path, self.pathfmt.realdirectory[:-1])
        self.assertEqual(pp.delete, True)
        self.assertEqual(pp.args, (
            pp.path + ".zip", "a", zipfile.ZIP_STORED, True,
        ))
        self.assertTrue(pp.args[0].endswith("/test.zip"))

    def test_zip_options(self):
        pp = self._create({
            "keep-files": True,
            "compression": "zip",
            "extension": "cbz",
        })
        self.assertEqual(pp.delete, False)
        self.assertEqual(pp.args, (
            pp.path + ".cbz", "a", zipfile.ZIP_DEFLATED, True,
        ))
        self.assertTrue(pp.args[0].endswith("/test.cbz"))

    def test_zip_write(self):
        with tempfile.NamedTemporaryFile("w", dir=self.dir.name) as file:
            pp = self._create({"files": [file.name, "_info_.json"],
                               "keep-files": True})

            filename = os.path.basename(file.name)
            file.write("foobar\n")

            # write dummy file with 3 different names
            for i in range(3):
                name = "file{}.ext".format(i)
                self.pathfmt.temppath = file.name
                self.pathfmt.filename = name

                self._trigger()

                # one more entry than files written so far; presumably the
                # existing path from "files" is added along with the first
                nti = pp.zfile.NameToInfo
                self.assertEqual(len(nti), i+2)
                self.assertIn(name, nti)

            # check file contents
            self.assertEqual(len(nti), 4)
            self.assertIn("file0.ext", nti)
            self.assertIn("file1.ext", nti)
            self.assertIn("file2.ext", nti)
            self.assertIn(filename, nti)

            # write the last file a second time (will be skipped)
            self._trigger()
            self.assertEqual(len(pp.zfile.NameToInfo), 4)

        # close file
        self._trigger(("finalize",), 0)

        # reopen to check persistence; the assertions must inspect the
        # freshly opened archive, not the writer object that was just closed
        with zipfile.ZipFile(pp.zfile.filename) as archive:
            nti = archive.NameToInfo
            self.assertEqual(len(nti), 4)
            self.assertIn("file0.ext", nti)
            self.assertIn("file1.ext", nti)
            self.assertIn("file2.ext", nti)
            self.assertIn(filename, nti)

        os.unlink(pp.zfile.filename)

    def test_zip_write_mock(self):

        def side_effect(_, name):
            # remember written names like a real archive would
            pp.zfile.NameToInfo.add(name)

        pp = self._create()
        pp.zfile = Mock()
        pp.zfile.NameToInfo = set()
        pp.zfile.write.side_effect = side_effect

        # write 3 files
        for i in range(3):
            self.pathfmt.temppath = self.pathfmt.realdirectory + "file.ext"
            self.pathfmt.filename = "file{}.ext".format(i)
            self._trigger()

        # write the last file a second time (should be skipped)
        self._trigger()

        # close file
        self._trigger(("finalize",), 0)

        self.assertEqual(pp.zfile.write.call_count, 3)
        for call in pp.zfile.write.call_args_list:
            args, kwargs = call
            self.assertEqual(len(args), 2)
            self.assertEqual(len(kwargs), 0)
            self.assertEqual(args[0], self.pathfmt.temppath)
            self.assertRegex(args[1], r"file\d\.ext")
        self.assertEqual(pp.zfile.close.call_count, 1)
2019-08-12 21:46:30 +02:00
if __name__ == "__main__":
    # run all test cases of this module when executed as a script
    unittest.main()