blog/build/index.py

#!/usr/bin/env python3

# should this operate on the same basic files as the rss script?

import sys
import re

# we expect the arguments to be filepaths to each blog post

def print_usage():
    """Print the command-line usage summary for this script to stdout."""
    usage_lines = (
        "\nusage: python mkblogindex.py POSTS\n",
        "\n",
        "\t\tPOSTS\tfilepaths of blog posts",
    )
    # each entry is written out followed by a newline, one after the other
    print(*usage_lines, sep="\n")

# everything after the script name is treated as a blog post filepath
posts = sys.argv[1:]

# without at least one post there is nothing to index: show usage and exit 1
if not posts:
    print_usage()
    sys.exit(1)

# Regexes used to pick apart post paths and post markup. They are written as
# raw strings so the backslashes reach the regex engine untouched instead of
# being treated as (invalid) Python string escapes.

# group 1 = leading directories, group 2 = the dated tail "YYYY/M/D/name.html"
dir_pattern = re.compile(r"(.+)/(\d{4}/\d+/\d+/.+\.html)")
# groups: 1 = leading directories, 2 = year, 3 = month, 4 = day, 5 = file stem;
# the dot before "html" is escaped so only a literal ".html" suffix matches
path_pattern = re.compile(r"(.+)/(\d{4})/(\d{1,2})/(\d{1,2})/(.+)\.html")
# captures the text between <h1> and </h1> when both sit on the same line
title_pattern = re.compile(r"<h1>(.+)</h1>")

# Reverse the argument order up front. The collected entries are sorted by
# date further down, so this only influences how entries that share the same
# date end up ordered relative to each other.
posts.reverse()

# (date markup, <li> markup) pairs, one per post
links = []

# for each file we want to output an <a> tag with a relative href to the site root
for path in posts:

    m = path_pattern.match(path)
    if m is None:
        # Not a dated post path: link to the bare file name and use a
        # placeholder date.
        url = path.split("/")[-1]
        # path/to/file.ext -> file
        title = url.split(".")[0]
        date = '<span class="post-date">0000-00-00</span>'

    else:
        year = m.group(2)
        # zero-pad so the date always reads YYYY-MM-DD
        month = m.group(3).rjust(2, "0")
        day = m.group(4).rjust(2, "0")

        date = f'<span class="post-date">{year}-{month}-{day}</span>'

        # The title is the first <h1>...</h1> found on a single line of the
        # post; it stays empty when the post has none.
        title = ""
        # explicit encoding so decoding does not depend on the platform
        # default -- assumes posts are UTF-8, TODO confirm
        with open(path, encoding="utf-8") as f:
            for line in f:
                # search (not match) so an indented heading is found as well
                heading = title_pattern.search(line)
                if heading:
                    title = f'<span class="post-title">{heading.group(1)}</span>'
                    break

        # clean leading directories to get the relative path we'll use for the link
        url = dir_pattern.sub(r"\2", path)
        url = f"blog/{url}"

    item = (date, f'<li><a href="{url}">{date}{title}</a></li>')
    links.append(item)

# newest first: order ascending by the date markup, then flip the whole list
links.sort(key=lambda entry: entry[0])
links.reverse()

# emit one <li> per post on stdout
for _date_markup, list_item in links:
    print(list_item)
make html 2023-03-11 14:29:39 +01:00			`#!/usr/bin/env python3`

isaac 2024-10-26 02:03:20 +02:00			`# should this operate on the same basic files as the rss script?`

make html 2023-03-11 14:29:39 +01:00			`import sys`
			`import re`

			`# we expect the arguments to be filepaths to each blog post`

			`def print_usage():`
			`print("\nusage: python mkblogindex.py POSTS\n")`
			`print("\n")`
			`print("\t\tPOSTS\tfilepaths of blog posts")`

			`# check args for at least one file path`
			`if len(sys.argv) < 2:`
			`print_usage()`
			`sys.exit(1)`

			`# posts are arguments from index 1 onwards`
			`posts = sys.argv[1:]`

update directory regex 2023-03-14 00:21:08 +01:00			`dir_pattern = re.compile("(.+)\/(\d{4}\/\d+\/\d+\/.+\.html)")`
make html 2023-03-11 14:29:39 +01:00			`path_pattern = re.compile("(.+)\/(\d{4})\/(\d{1,2})\/(\d{1,2})\/(.+).html")`
			`title_pattern = re.compile("<h1>(.+)</h1>")`

			`posts.reverse()`

			`links = []`

			`# for each file we want to output an <a> tag with a relative href to the site root`
			`for path in posts:`
isaac 2024-10-26 02:03:20 +02:00
make html 2023-03-11 14:29:39 +01:00			`m = re.match(path_pattern, path)`
isaac 2024-10-26 02:03:20 +02:00			`if not m:`
			`# path/to/file.ext -> file`
			`title = path.split('/')[-1].split(".")[0]`

			`date = f'<span class="post-date">0000-00-00</span>'`
			`url = path.split("/")[-1]`

			`else:`
			`year = m.group(2)`
			`month = m.group(3).rjust(2, '0')`
			`day = m.group(4).rjust(2, '0')`

			`date = f'<span class="post-date">{year}-{month}-{day}</span>'`

			`title = ""`
			`with open(path) as f:`
			`for line in f:`
			`if title_pattern.match(line):`
			`title = re.sub(title_pattern, r'<span class="post-title">\1</span>', line).strip()`
			`break`

			`# clean leading directories to get the relative path we'll use for the link`
			`url = re.sub(dir_pattern, r"\2", path)`
			`url = f"blog/{url}"`
make html 2023-03-11 14:29:39 +01:00
			`item = (date, f'<li><a href="{url}">{date}{title}</a></li>')`
			`links.append(item)`

			`# make sure we're properly ordered in reverse date order lol`
			`links = sorted(links, key=lambda x: x[0])`
			`links.reverse()`

			`for l in links:`
			`print(l[1])`