Allow specifying an editor as well as/instead of an author
[books.alexwlchan.net] / scripts / render_html.py
index 0cbb13f..048a7fc 100755 (executable)
@@ -1,6 +1,7 @@
-#!/usr/bin/env python
+#!/usr/bin/env python3
 
 import datetime
 
 import datetime
+import hashlib
 import itertools
 import os
 import pathlib
 import itertools
 import os
 import pathlib
@@ -9,23 +10,72 @@ import subprocess
 import sys
 
 import attr
 import sys
 
 import attr
+import bs4
+import cssmin
 import frontmatter
 from jinja2 import Environment, FileSystemLoader, select_autoescape
 import markdown
 from markdown.extensions.smarty import SmartyExtension
 import smartypants
 
 import frontmatter
 from jinja2 import Environment, FileSystemLoader, select_autoescape
 import markdown
 from markdown.extensions.smarty import SmartyExtension
 import smartypants
 
+from generate_bookshelf import create_shelf_data_uri
+from tint_colors import get_tint_colors, store_tint_color
+
 
 def rsync(dir1, dir2):
     subprocess.check_call(["rsync", "--recursive", "--delete", dir1, dir2])
 
 
 
 def rsync(dir1, dir2):
     subprocess.check_call(["rsync", "--recursive", "--delete", dir1, dir2])
 
 
+def git(*args):
+    return subprocess.check_output(["git"] + list(args)).strip().decode("utf8")
+
+
+def set_git_timestamps():
+    """
+    For every file in the src/covers/ directory, set the last modified timestamp to
+    the last time it was modified in Git.  This should make tint colour computations
+    stable across machines.
+    """
+    root = git("rev-parse", "--show-toplevel")
+
+    now = datetime.datetime.now().timestamp()
+
+    for f in os.listdir("src/covers"):
+        path = os.path.join("src/covers", f)
+
+        if not os.path.isfile(path):
+            continue
+
+        stat = os.stat(path)
+
+        # If the file was last modified more than 7 days ago, skip it unless --reset was
+        # passed.  This keeps the script fast when doing a regular sync.
+        if now - stat.st_mtime > 7 * 24 * 60 * 60 and "--reset" not in sys.argv:
+            continue
+
+        revision = git("rev-list", "--max-count=1", "HEAD", path)
+
+        if not revision:
+            continue
+
+        timestamp, *_ = git("show", "--pretty=format:%ai", "--abbrev-commit", revision).splitlines()
+        modified_time = datetime.datetime.strptime(timestamp, "%Y-%m-%d %H:%M:%S %z").timestamp()
+
+        access_time = stat.st_atime
+
+        os.utime(path, times=(access_time, modified_time))
+
+
 @attr.s
 class Book:
 @attr.s
 class Book:
+    slug = attr.ib()
     title = attr.ib()
     title = attr.ib()
-    author = attr.ib()
     publication_year = attr.ib()
     publication_year = attr.ib()
-    cover_image = attr.ib()
+
+    author = attr.ib(default="")
+    editor = attr.ib(default="")
+
+    cover_image = attr.ib(default="")
     cover_desc = attr.ib(default="")
 
     isbn10 = attr.ib(default="")
     cover_desc = attr.ib(default="")
 
     isbn10 = attr.ib(default="")
@@ -36,7 +86,8 @@ class Book:
 class Review:
     date_read = attr.ib()
     text = attr.ib()
 class Review:
     date_read = attr.ib()
     text = attr.ib()
-    format = attr.ib()
+    date_order = attr.ib(default=1)
+    format = attr.ib(default=None)
     rating = attr.ib(default=None)
     did_not_finish = attr.ib(default=False)
 
     rating = attr.ib(default=None)
     did_not_finish = attr.ib(default=False)
 
@@ -55,7 +106,16 @@ class ReviewEntry:
 def get_review_entry_from_path(path):
     post = frontmatter.load(path)
 
 def get_review_entry_from_path(path):
     post = frontmatter.load(path)
 
-    book = Book(**post["book"])
+    kwargs = {}
+    for attr_name in Book.__attrs_attrs__:
+        try:
+            kwargs[attr_name.name] = post["book"][attr_name.name]
+        except KeyError:
+            pass
+
+    kwargs["slug"] = os.path.basename(os.path.splitext(path)[0])
+    book = Book(**kwargs)
+
     review = Review(**post["review"], text=post.content)
 
     return ReviewEntry(path=path, book=book, review=review)
     review = Review(**post["review"], text=post.content)
 
     return ReviewEntry(path=path, book=book, review=review)
@@ -76,7 +136,9 @@ class CurrentlyReadingEntry:
 def get_reading_entry_from_path(path):
     post = frontmatter.load(path)
 
 def get_reading_entry_from_path(path):
     post = frontmatter.load(path)
 
-    book = Book(**post["book"])
+    slug = os.path.basename(os.path.splitext(path)[0])
+    book = Book(slug=slug, **post["book"])
+
     reading = CurrentlyReading(text=post.content)
 
     return CurrentlyReadingEntry(path=path, book=book, reading=reading)
     reading = CurrentlyReading(text=post.content)
 
     return CurrentlyReadingEntry(path=path, book=book, reading=reading)
@@ -105,8 +167,10 @@ class PlanEntry:
 def get_plan_entry_from_path(path):
     post = frontmatter.load(path)
 
 def get_plan_entry_from_path(path):
     post = frontmatter.load(path)
 
-    book = Book(**post["book"])
-    plan = Plan(**post["plan"], text=post.content)
+    slug = os.path.basename(os.path.splitext(path)[0])
+    book = Book(slug=slug, **post["book"])
+
+    plan = Plan(date_added=post["plan"]["date_added"], text=post.content)
 
     return PlanEntry(path=path, book=book, plan=plan)
 
 
     return PlanEntry(path=path, book=book, plan=plan)
 
@@ -132,7 +196,7 @@ def render_markdown(text):
 
 def render_date(date_value):
     if isinstance(date_value, datetime.date):
 
 def render_date(date_value):
     if isinstance(date_value, datetime.date):
-        return date_value.strftime("%d %B %Y")
+        return date_value.strftime("%-d %B %Y")
 
     date_match = re.match(
         r"^(?P<year>\d{4})-(?P<month>\d{2})(?:-(?P<day>\d{2}))?$", date_value
 
     date_match = re.match(
         r"^(?P<year>\d{4})-(?P<month>\d{2})(?:-(?P<day>\d{2}))?$", date_value
@@ -146,24 +210,85 @@ def render_date(date_value):
     )
 
     if date_match.group("day"):
     )
 
     if date_match.group("day"):
-        return date_obj.strftime("%-d %B %Y")
+        return render_date(date_obj)
     else:
         return date_obj.strftime("%B %Y")
 
 
     else:
         return date_obj.strftime("%B %Y")
 
 
-def render_individual_review(env, *, review_entry):
-    template = env.get_template("review.html")
-    html = template.render(
-        review_entry=review_entry, title=f"My review of {review_entry.book.title}"
-    )
-
-    out_name = review_entry.out_path() / "index.html"
-    out_path = pathlib.Path("_html") / out_name
+def save_html(template, out_name="", **kwargs):
+    html = template.render(**kwargs)
+    out_path = pathlib.Path("_html") / out_name / "index.html"
     out_path.parent.mkdir(exist_ok=True, parents=True)
     out_path.parent.mkdir(exist_ok=True, parents=True)
-    out_path.write_text(html)
+
+    soup = bs4.BeautifulSoup(html, "html.parser")
+
+    # Minify the CSS in all inline <style> tags.
+    for style_tag in soup.find_all("style"):
+        style_tag.string = cssmin.cssmin(style_tag.string)
+
+    # Remove any comments
+    for comment in soup(text=lambda text: isinstance(text, bs4.Comment)):
+        comment.extract()
+
+    out_path.write_text(str(soup))
+
+
+def _create_new_thumbnail(src_path, dst_path):
+    dst_path.parent.mkdir(exist_ok=True, parents=True)
+
+    # Thumbnails are 240x240 max, then 2x for retina displays
+    subprocess.check_call([
+        "convert", src_path, "-resize", "480x480>", dst_path
+    ])
+
+
+def thumbnail_1x(name):
+    pth = pathlib.Path(name)
+    return pth.stem + "_1x" + pth.suffix
+
+
+def _create_new_square(src_path, square_path):
+    square_path.parent.mkdir(exist_ok=True, parents=True)
+
+    subprocess.check_call([
+        "convert",
+        src_path, "-resize", "240x240", "-gravity", "center", "-background", "white", "-extent", "240x240", square_path
+    ])
+
+
+def create_thumbnails():
+    for image_name in os.listdir("src/covers"):
+        if image_name == ".DS_Store":
+            continue
+
+        src_path = pathlib.Path("src/covers") / image_name
+        dst_path = pathlib.Path("_html/thumbnails") / image_name
+
+        if not dst_path.exists():
+            _create_new_thumbnail(src_path, dst_path)
+        elif src_path.stat().st_mtime > dst_path.stat().st_mtime:
+            _create_new_thumbnail(src_path, dst_path)
+
+        square_path = pathlib.Path("_html/squares") / image_name
+
+        if not square_path.exists():
+            _create_new_square(src_path, square_path)
+        elif src_path.stat().st_mtime > square_path.stat().st_mtime:
+            _create_new_square(src_path, square_path)
+
+        store_tint_color(dst_path)
+
+
+CSS_HASH = hashlib.md5(open('static/style.css', 'rb').read()).hexdigest()
+
+
+def css_hash(_):
+    return f"md5:{CSS_HASH}"
 
 
 def main():
 
 
 def main():
+    set_git_timestamps()
+
     env = Environment(
         loader=FileSystemLoader("templates"),
         autoescape=select_autoescape(["html", "xml"]),
     env = Environment(
         loader=FileSystemLoader("templates"),
         autoescape=select_autoescape(["html", "xml"]),
@@ -172,6 +297,13 @@ def main():
     env.filters["render_markdown"] = render_markdown
     env.filters["render_date"] = render_date
     env.filters["smartypants"] = smartypants.smartypants
     env.filters["render_markdown"] = render_markdown
     env.filters["render_date"] = render_date
     env.filters["smartypants"] = smartypants.smartypants
+    env.filters["thumbnail_1x"] = thumbnail_1x
+    env.filters["css_hash"] = css_hash
+    env.filters["create_shelf_data_uri"] = create_shelf_data_uri
+
+    create_thumbnails()
+
+    tint_colors = get_tint_colors()
 
     rsync("src/covers/", "_html/covers/")
     rsync("static/", "_html/static/")
 
     rsync("src/covers/", "_html/covers/")
     rsync("static/", "_html/static/")
@@ -182,14 +314,21 @@ def main():
         get_entries(dirpath="src/reviews", constructor=get_review_entry_from_path)
     )
     all_reviews = sorted(
         get_entries(dirpath="src/reviews", constructor=get_review_entry_from_path)
     )
     all_reviews = sorted(
-        all_reviews, key=lambda rev: str(rev.review.date_read), reverse=True
+        all_reviews, key=lambda rev: f"{rev.review.date_read}/{rev.review.date_order}", reverse=True
     )
 
     for review_entry in all_reviews:
     )
 
     for review_entry in all_reviews:
-        render_individual_review(env, review_entry=review_entry)
+        save_html(
+            template=env.get_template("review.html"),
+            out_name=review_entry.out_path(),
+            review_entry=review_entry,
+            title=f"My review of {review_entry.book.title}",
+            tint_colors=tint_colors
+        )
 
 
-    template = env.get_template("list_reviews.html")
-    html = template.render(
+    save_html(
+        template=env.get_template("list_reviews.html"),
+        out_name="reviews",
         all_reviews=[
             (year, list(reviews))
             for (year, reviews) in itertools.groupby(
         all_reviews=[
             (year, list(reviews))
             for (year, reviews) in itertools.groupby(
@@ -198,11 +337,9 @@ def main():
         ],
         title="books i’ve read",
         this_year=str(datetime.datetime.now().year),
         ],
         title="books i’ve read",
         this_year=str(datetime.datetime.now().year),
+        tint_colors=tint_colors
     )
 
     )
 
-    out_path = pathlib.Path("_html") / "reviews/index.html"
-    out_path.write_text(html)
-
     # Render the "currently reading" page
 
     all_reading = list(
     # Render the "currently reading" page
 
     all_reading = list(
@@ -211,12 +348,13 @@ def main():
         )
     )
 
         )
     )
 
-    template = env.get_template("list_reading.html")
-    html = template.render(all_reading=all_reading, title="books i’m currently reading")
-
-    out_path = pathlib.Path("_html") / "reading/index.html"
-    out_path.parent.mkdir(exist_ok=True, parents=True)
-    out_path.write_text(html)
+    save_html(
+        template=env.get_template("list_reading.html"),
+        out_name="reading",
+        all_reading=all_reading,
+        title="books i’m currently reading",
+        tint_colors=tint_colors
+    )
 
     # Render the "want to read" page
 
 
     # Render the "want to read" page
 
@@ -224,22 +362,42 @@ def main():
         get_entries(dirpath="src/plans", constructor=get_plan_entry_from_path)
     )
 
         get_entries(dirpath="src/plans", constructor=get_plan_entry_from_path)
     )
 
-    all_plans = sorted(all_plans, key=lambda plan: plan.plan.date_added)
+    all_plans = sorted(all_plans, key=lambda plan: plan.plan.date_added, reverse=True)
 
 
-    template = env.get_template("list_plans.html")
-    html = template.render(all_plans=all_plans, title="books i want to read")
+    save_html(
+        template=env.get_template("list_plans.html"),
+        out_name="to-read",
+        all_plans=all_plans,
+        title="books i want to read",
+        tint_colors=tint_colors,
+    )
 
 
-    out_path = pathlib.Path("_html") / "to-read/index.html"
-    out_path.parent.mkdir(exist_ok=True, parents=True)
-    out_path.write_text(html)
+    # Render the "never going to read this" page
 
 
-    # Render the front page
+    all_retired = list(
+        get_entries(dirpath="src/will_never_read", constructor=get_plan_entry_from_path)
+    )
+
+    all_retired = sorted(
+        all_retired, key=lambda plan: plan.plan.date_added, reverse=True
+    )
 
 
-    index_template = env.get_template("index.html")
-    html = index_template.render(text=open("src/index.md").read())
+    save_html(
+        template=env.get_template("list_will_never_read.html"),
+        out_name="will-never-read",
+        all_retired=all_retired,
+        title="books i&rsquo;m never going to read",
+        tint_colors=tint_colors
+    )
+
+    # Render the front page
 
 
-    index_path = pathlib.Path("_html") / "index.html"
-    index_path.write_text(html)
+    save_html(
+        template=env.get_template("index.html"),
+        text=open("src/index.md").read(),
+        reviews=all_reviews[:5],
+        tint_colors=tint_colors
+    )
 
     print("✨ Rendered HTML files to _html ✨")
 
 
     print("✨ Rendered HTML files to _html ✨")