import json
import os
from zipfile import ZipFile
import pytest
from hircine.scraper.utils import open_archive_file, parse_dict
def test_parse_dict():
data = {
"scalar": "foo",
"list": ["bar", "baz"],
"dict": {"nested_scalar": "qux", "nested_list": ["plugh", "xyzzy"]},
}
def annotate(tag):
return lambda item: f"{tag}_{item}"
parsers = {
"scalar": annotate("scalar"),
"list": annotate("list"),
"dict": {"nested_scalar": annotate("scalar"), "nested_list": annotate("list")},
"missing": annotate("missing"),
}
assert [f() for f in parse_dict(parsers, data)] == [
"scalar_foo",
"list_bar",
"list_baz",
"scalar_qux",
"list_plugh",
"list_xyzzy",
]
@pytest.mark.parametrize(
"check_sidecar",
[
(False),
(True),
],
ids=[
"zip",
"sidecar",
],
)
def test_open_archive_file(gen_archive, tmpdir, check_sidecar):
archive = next(gen_archive)
archive.path = os.path.join(tmpdir, "archive.zip")
zip_data = {"zip": "data"}
sidecar_data = {"sidecar": "data"}
with open(f"{archive.path}.info.json", "x") as handle:
json.dump(sidecar_data, handle)
with ZipFile(archive.path, "x") as ziph:
ziph.writestr("info.json", json.dumps(zip_data))
with open_archive_file(archive, "info.json", check_sidecar=check_sidecar) as file:
data = json.load(file)
if check_sidecar:
assert data == sidecar_data
else:
assert data == zip_data