Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Automatically generate sitemap.xml after building HTMLs #89

Merged
merged 2 commits into from
Aug 31, 2022
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
10 changes: 10 additions & 0 deletions archive.py
Original file line number Diff line number Diff line change
Expand Up @@ -49,6 +49,8 @@

from lib.website import build_website

from lib.sitemap import build_sitemap

try:
import settings
except ModuleNotFoundError:
Expand Down Expand Up @@ -145,6 +147,12 @@ def run():
parser.add_argument(
"-b", action="store_true", default=False, help="Build .md files"
)
parser.add_argument(
"--no-sitemap",
action="store_true",
default=False,
help="Don't build sitemap files",
)
parser.add_argument(
"-t", action="store_true", default=False, help="Make a clean json archive"
)
Expand Down Expand Up @@ -206,6 +214,8 @@ def run():
settings.page_head_html,
settings.page_footer_html,
)
if not results.no_sitemap:
build_sitemap(settings.site_url, md_root.as_posix(), md_root.as_posix())


if __name__ == "__main__":
Expand Down
3 changes: 1 addition & 2 deletions entrypoint.sh
Original file line number Diff line number Diff line change
Expand Up @@ -32,8 +32,7 @@ python3 get-pip.py
pip install virtualenv
virtualenv -p python3 .
source bin/activate
pip3 install zulip==0.6.3
pip3 install pyyaml==5.2
pip3 install install -r requirements.txt
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

install is here twice: #96

# crudini is not available as an Alpine pkg, so we install via pip.
pip3 install crudini

Expand Down
16 changes: 16 additions & 0 deletions lib/sitemap.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
from glob import iglob
from typing import Iterator

from xml_sitemap_writer import XMLSitemap


def build_sitemap(base_url: str, archive_dir_path: str, sitemap_write_dir_path: str):
def iterate_html_files() -> Iterator[str]:
# Iterator yields relative path like
# archive/stream/10-errors/topic/laptop.html
# TODO: Investigate when running in windows
# TODO: Must ensure that the relative URLs are valid
return iglob("**/*.html", root_dir=archive_dir_path, recursive=True)

with XMLSitemap(sitemap_write_dir_path, base_url) as sitemap:
sitemap.add_urls(iterate_html_files())
3 changes: 3 additions & 0 deletions requirements.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
pyyaml==5.2
xml-sitemap-writer==0.5.0
zulip==0.6.3