2023-03-11 14:29:39 +01:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
|
2024-10-26 02:03:20 +02:00
|
|
|
# should this operate on the same basic files as the rss script?
|
|
|
|
|
2023-03-11 14:29:39 +01:00
|
|
|
import sys
|
|
|
|
import re
|
|
|
|
|
|
|
|
# we expect the arguments to be filepaths to each blog post
|
|
|
|
|
|
|
|
def print_usage():
|
|
|
|
print("\nusage: python mkblogindex.py POSTS\n")
|
|
|
|
print("\n")
|
|
|
|
print("\t\tPOSTS\tfilepaths of blog posts")
|
|
|
|
|
|
|
|
# check args for at least one file path
|
|
|
|
if len(sys.argv) < 2:
|
|
|
|
print_usage()
|
|
|
|
sys.exit(1)
|
|
|
|
|
|
|
|
# posts are arguments from index 1 onwards
|
|
|
|
posts = sys.argv[1:]
|
|
|
|
|
2023-03-14 00:21:08 +01:00
|
|
|
dir_pattern = re.compile("(.+)\/(\d{4}\/\d+\/\d+\/.+\.html)")
|
2023-03-11 14:29:39 +01:00
|
|
|
path_pattern = re.compile("(.+)\/(\d{4})\/(\d{1,2})\/(\d{1,2})\/(.+).html")
|
|
|
|
title_pattern = re.compile("<h1>(.+)</h1>")
|
|
|
|
|
|
|
|
posts.reverse()
|
|
|
|
|
|
|
|
links = []
|
|
|
|
|
|
|
|
# for each file we want to output an <a> tag with a relative href to the site root
|
|
|
|
for path in posts:
|
2024-10-26 02:03:20 +02:00
|
|
|
|
2023-03-11 14:29:39 +01:00
|
|
|
m = re.match(path_pattern, path)
|
2024-10-26 02:03:20 +02:00
|
|
|
if not m:
|
|
|
|
# path/to/file.ext -> file
|
|
|
|
title = path.split('/')[-1].split(".")[0]
|
|
|
|
|
|
|
|
date = f'<span class="post-date">0000-00-00</span>'
|
|
|
|
url = path.split("/")[-1]
|
|
|
|
|
|
|
|
else:
|
|
|
|
year = m.group(2)
|
|
|
|
month = m.group(3).rjust(2, '0')
|
|
|
|
day = m.group(4).rjust(2, '0')
|
|
|
|
|
|
|
|
date = f'<span class="post-date">{year}-{month}-{day}</span>'
|
|
|
|
|
|
|
|
title = ""
|
|
|
|
with open(path) as f:
|
|
|
|
for line in f:
|
|
|
|
if title_pattern.match(line):
|
|
|
|
title = re.sub(title_pattern, r'<span class="post-title">\1</span>', line).strip()
|
|
|
|
break
|
|
|
|
|
|
|
|
# clean leading directories to get the relative path we'll use for the link
|
|
|
|
url = re.sub(dir_pattern, r"\2", path)
|
|
|
|
url = f"blog/{url}"
|
2023-03-11 14:29:39 +01:00
|
|
|
|
|
|
|
item = (date, f'<li><a href="{url}">{date}{title}</a></li>')
|
|
|
|
links.append(item)
|
|
|
|
|
|
|
|
# make sure we're properly ordered in reverse date order lol
|
|
|
|
links = sorted(links, key=lambda x: x[0])
|
|
|
|
links.reverse()
|
|
|
|
|
|
|
|
for l in links:
|
|
|
|
print(l[1])
|
|
|
|
|