Skip to content

Commit a104967

Browse files
authored
Merge pull request #213 from openzim/customize_publisher
Customize / Harmonize publisher + other small fixes
2 parents 2fd98ed + 727fc44 commit a104967

File tree

5 files changed

+25
-6
lines changed

5 files changed

+25
-6
lines changed

ChangeLog

+11
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,17 @@ as of 2.0.0.
88

99
## [Unreleased]
1010

11+
### Added
12+
- `Publisher` ZIM metadata can now be customized at CLI (#210)
13+
14+
### Changed
15+
- `Publisher` ZIM metadata default value is changed to `openZIM` intead of `Kiwix` (#210)
16+
17+
### Fixed
18+
- Do not fail if temporary directory already exists (#207)
19+
- Typo in `Scraper` ZIM metadata (#212)
20+
- Adapt to hatchling v1.19.0 which mandates packages setting (#211)
21+
1122
## [2.1.0] - 2023-08-18
1223

1324
### Changed

pyproject.toml

+4-1
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ build-backend = "hatchling.build"
66
name = "gutenberg2zim"
77
authors = [{ name = "Kiwix", email = "[email protected]" }]
88
keywords = ["kiwix", "zim", "offline", "gutenberg"]
9-
requires-python = ">=3.11"
9+
requires-python = ">=3.11,<3.12"
1010
description = "Make ZIM file from Gutenberg books"
1111
readme = "pypi-readme.rst"
1212
license = { text = "GPL-3.0-or-later" }
@@ -69,6 +69,9 @@ exclude = ["/.github"]
6969
path = "hatch_build.py"
7070
dependencies = ["zimscraperlib==3.1.1"]
7171

72+
[tool.hatch.build.targets.wheel]
73+
packages = ["src/gutenberg2zim"]
74+
7275
[tool.hatch.envs.default]
7376
features = ["dev"]
7477

src/gutenberg2zim/entrypoint.py

+5-2
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@
2222
"""[--prepare] [--parse] [--download] [--export] [--dev] """
2323
"""[--zim] [--complete] [-m ONE_LANG_ONE_ZIM_FOLDER] """
2424
"""[--title-search] [--bookshelves] [--optimization-cache S3URL] """
25-
"""[--stats-filename STATS_FILENAME]"""
25+
"""[--stats-filename STATS_FILENAME] [--publisher ZIM_PUBLISHER]"""
2626
"""
2727
2828
-h --help Display this help message
@@ -63,6 +63,7 @@
6363
--use-any-optimized-version Try to use any optimized version found on """
6464
"""optimization cache
6565
--stats-filename=<filename> Path to store the progress JSON file to
66+
--publisher=<zim_publisher> Custom Publisher in ZIM Metadata (openZIM otherwise)
6667
6768
This script is used to produce a ZIM file (and any intermediate state)
6869
of Gutenberg repository using a mirror."""
@@ -102,6 +103,7 @@ def main():
102103
optimization_cache = arguments.get("--optimization-cache") or None
103104
use_any_optimized_version = arguments.get("--use-any-optimized-version", False)
104105
stats_filename = arguments.get("--stats-filename") or None
106+
publisher = arguments.get("--publisher") or "openZIM"
105107

106108
s3_storage = None
107109
if optimization_cache:
@@ -111,7 +113,7 @@ def main():
111113
logger.info("S3 Credentials OK. Continuing ... ")
112114

113115
# create tmp dir
114-
TMP_FOLDER_PATH.mkdir(parents=True)
116+
TMP_FOLDER_PATH.mkdir(parents=True, exist_ok=True)
115117

116118
languages = [
117119
x.strip().lower()
@@ -224,4 +226,5 @@ def f(x):
224226
title=zim_title,
225227
description=zim_desc,
226228
stats_filename=stats_filename,
229+
publisher=publisher,
227230
)

src/gutenberg2zim/shared.py

+3-3
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ def inc_progress():
3232
Global.progress += 1
3333

3434
@staticmethod
35-
def setup(filename, language, title, description, name):
35+
def setup(filename, language, title, description, name, publisher):
3636
Global.creator = Creator(
3737
filename=filename,
3838
main_path="Home.html",
@@ -41,10 +41,10 @@ def setup(filename, language, title, description, name):
4141
title=title,
4242
description=description,
4343
creator="gutenberg.org", # type: ignore
44-
publisher="Kiwix", # type: ignore
44+
publisher=publisher, # type: ignore
4545
name=name,
4646
tags="_category:gutenberg;gutenberg", # type: ignore
47-
scraper=f"gutengergtozim-{VERSION}", # type: ignore
47+
scraper=f"gutenberg2zim-{VERSION}", # type: ignore
4848
date=date.today(), # type: ignore
4949
).config_verbose(True)
5050

src/gutenberg2zim/zim.py

+2
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,7 @@ def build_zimfile(
2828
title,
2929
description,
3030
stats_filename,
31+
publisher,
3132
):
3233
# actual list of languages with books sorted by most used
3334
nb = fn.COUNT(Book.language).alias("nb")
@@ -76,6 +77,7 @@ def build_zimfile(
7677
title=title,
7778
description=description,
7879
name=project_id,
80+
publisher=publisher,
7981
)
8082

8183
Global.start()

0 commit comments

Comments
 (0)