#!/usr/bin/env python3 import sys import re # we expect the arguments to be filepaths to each blog post def print_usage(): print("\nusage: python mkblogindex.py POSTS\n") print("\n") print("\t\tPOSTS\tfilepaths of blog posts") # check args for at least one file path if len(sys.argv) < 2: print_usage() sys.exit(1) # posts are arguments from index 1 onwards posts = sys.argv[1:] dir_pattern = re.compile("(.+)/(blog\/.+\.html)") path_pattern = re.compile("(.+)\/(\d{4})\/(\d{1,2})\/(\d{1,2})\/(.+).html") title_pattern = re.compile("

(.+)

") # filter posts to just those with a date in them posts = [p for p in posts if path_pattern.match(p)] # for each file we want to output an tag with a relative href to the site root for path in posts: date = re.sub(path_pattern, r'\2-\3-\4', path) title = "" with open(path) as f: for line in f: if title_pattern.match(line): title = re.sub(title_pattern, r'\1', line).strip() break # clean leading directories to get the relative path we'll use for the link url = re.sub(dir_pattern, r"\2", path) print(f'
  • {date}{title}
  • ')