build.sh

#!/bin/bash

set -e

tmp="$(mktemp -d)"

finish() {
	echo "Done, removing $tmp"
	rm -r "$tmp"
}

trap finish EXIT

# Akas are permanent names that redirect to various resources. If the location of the resource changes, the aka can simply be updated.
# Due to being hosted on Github pages we do not have direct control over redirects, so we must use meta refresh directives.
echo "Akas..."

mkdir -p aka

redirecthtmlpage() {
	url="$1"

	echo "<!DOCTYPE html>"
	echo "<title>Redirecting to $url</title>"

	# Refresh the page immediately to the desired URL.
	echo "<meta http-equiv='refresh' content='0; URL=$url'>"

	# However, we don't want any caching, so if we update the URL it will be immediately reflected in the redirect.
	echo '<meta http-equiv="Cache-Control" content="no-cache, no-store, must-revalidate" />'
	echo '<meta http-equiv="Pragma" content="no-cache" />'
	echo '<meta http-equiv="Expires" content="0" />'

	echo '<meta name="viewport" content="width=device-width, initial-scale=1">'

	# Additional links to the URL.
	echo "<link rel='canonical' href='$url'>"
	echo "Redirecting to <a href='$url'>$url</a>..." # The user can click this one if their browser doesn't redirect them.
}

N_AKAS=0

# Each line in akas.txt has the format:
# <name of redirect> <url of redirect>
while read line; do
	# Split the aka line into the name and url
	name="$(echo "$line" | cut -d' ' -f1)"
	url="$(echo "$line" | cut -d' ' -f2-)"

	echo " $name -> $url"

	echo "<tr><td><a href='$name'>$name</a></td> <td><a href='$url'>$url</a></td> <td><a href='$name.qr.svg'>SVG</a> <a href='$name.qr.png'>PNG</a></td></tr>" >> "$tmp/_akas.in.html"

	N_AKAS=$((N_AKAS+1))

	(
		redirecthtmlpage "$url" > "aka/$name.html"
		qrencode -o "aka/$name.qr.svg" -l M -t SVG -s 10 -m 2 "https://benleskey.com/aka/$name"
		qrencode -o "aka/$name.qr.png" -l M -t PNG -s 20 -m 2 "https://benleskey.com/aka/$name"
	) &
done < akas.txt

echo "Downloading images..."
while read line; do
	output="$(echo "$line" | cut -d' ' -f1)"
	input="$(echo "$line" | cut -d' ' -f2-)"

	echo " Downloading $input -> $output"

	curl -sSL "$input" > "images/$output" &
done < images.txt

# replacefile <placeholder> <path to file>
# A pipeline function to replace a placeholder with the contents of a file
replacefile() {
	placeholder="$1"
	path="$2"

	replacetext "$placeholder" "$(cat "$path")"
}

# replacetext <placeholder> <text to insert>
# A pipeline function to replace a placeholder with text
replacetext() {
	placeholder="$1"

	text="$(echo "$2" | sed 's|\\|\\\\|g' | sed 's|&|\\&|g' | sed '$!s/$/\\n/' | tr -d '\n')"

	sed -f <(echo "s&$placeholder&$text&g")
	#awk -v placeholder="$placeholder" -v text="$text" '{gsub(placeholder, text); print}'
}

htmlescape() {
	python3 -c "import html, sys; sys.stdout.write(html.escape(sys.stdin.read()))"
}

basereplace() {
	toroot="$1"

	replacetext "__RDATE__" "$(TZ=UTC date -R)" |
	replacetext "__YEAR__" "$(TZ=UTC date +%Y)" |
	replacetext "__DATE__" "$(TZ=UTC date -I)" |
	replacetext "__ROOT__" "$toroot"
}

commonreplace() {
	basereplace "$@" |
	replacetext "__FOOTERICONS__" "$(basereplace "$@" < templates/footer_icons.in.html)"
}

mkdir -p page
mkdir -p blog/tags
mkdir -p "$tmp"/tags

# The list of all tags, to be built up as posts are processed.
alltags=""

# Maximum blog posts in the "minor" list, i.e. on the front page.
BMMAX=7

# Maximum blog posts in an RSS feed
RSSMAX=15

# Maximum number of words in the RSS description summary
SUMMARY_WORDS=100

# Number of blog posts so far.
BN=0
PN=0

echo "Blog..."

# Begin the major and minor blog post lists.
echo "<ul>" > "$tmp"/_major.in.html
echo "<ul>" > "$tmp"/_minor.in.html

# The post function is called from the posts.sh list of posts; it is responsible for processing each blog post.
# A post has four components, reflected in the arguments:
# post <human-redable identifier name> <human-readable, pretty title of post> <date YYYY-MM-DD> <space-delimited list of tags>
post() {
	name="$1"
	title="$2"
	date="$3"
	tags="$4"

	series="$POST_SERIES"

	# We'll be reading the text of the blog post from an input HTML file and generating the full HTML page.
	infile="blog.in/$name.in.html"
	outfile="blog/$name.html"
	outfeed="$tmp/_$name.xml"

	echo " $name: $title [$date]"

	# We will collect all the tags and build a list of hyperlinks to insert into the HTML.
	# HTML for the tag lists are generated for each different place they must be used with different styling and URLs (since sometimes we need blog/tags#tag and sometimes just tags/#tag if we are within the blog itself).

	taghtml="" # The list of tags to be used within the blog posts.
	smalltaghtml="" # The list of tags to be used within the "major" blog post list, on the dedicated blog page.
	minortaghtml="" # The list of tags to be used within the "minor" blog post list, on the main page.

	while read tag; do
		taghtml="$taghtml <a class='tag' href='__ROOT__/blog/tags/$tag'>#$tag</a>"
		minortaghtml="$minortaghtml <a class='smalltag' href='__ROOT__/blog/tags/$tag'>#$tag</a>"
		smalltaghtml="$smalltaghtml <a class='smalltag' href='__ROOT__/blog/tags/$tag'>#$tag</a>"

		# If we haven't seen this tag yet in any post, record it and clear away any old file built from this tag.
		if ! echo "$alltags" | grep -w "$tag" > /dev/null; then
			echo " New tag: $tag"
			alltags="$alltags $tag"
		fi

	done < <(echo "$tags" | xargs -n1 | sort | uniq | xargs -n1 --no-run-if-empty)

	dateinfo="$date"
	latestdate="$date"

	if [ -n "$POST_UPDATED" ]; then
		dateinfo="$date, $POST_UPDATED"
		latestdate="$POST_UPDATED"
	fi

	post_global_link="https://benleskey.com/blog/$name"
	post_link="__ROOT__/blog/$name"
	post_base_link="https://benleskey.com/blog/$name"
	post_listing_class=""

	if [ -n "$POST_EXTERNAL" ]; then
		post_link="$POST_EXTERNAL"
		post_base_link="$POST_EXTERNAL"
		post_listing_class="external"
	fi

	if [ -n "$POST_INTERNAL" ]; then
		post_link="__ROOT__/page/$POST_INTERNAL"
		post_base_link="https://benleskey.com/page/$POST_INTERNAL"
	fi

	# Now we will write a link to this post to the each of its tags' pages.
	# We do this after tag processing because a link to the post also includes its tags, so we need to know all the tags of the post.
	while read tag; do
		echo "<li class='postlisting $post_listing_class'><a href='$post_link'>$title</a> [$dateinfo] $smalltaghtml</li>" >> "$tmp/_tag_$tag.html"
	done < <(echo "$tags" | xargs -n1 --no-run-if-empty)

	# Record that another post was processed.
	BN=$((BN+1))

	# If we haven't reached the limit for "minor" posts, add a link to the minor blog post listing HTML, this is for the "recent posts" section of the main page.
	if [ $BN -le $BMMAX ]; then
		echo "<li class='postlisting $post_listing_class'><a href='$post_link'>$title</a> [$dateinfo] $minortaghtml</li>" >> "$tmp"/_minor.in.html
	fi

	# Always add a link to the "major" blog post listing HTML, this is for the dedicated blog page.
	echo "<li class='postlisting $post_listing_class'><a href='$post_link'>$title</a> [$dateinfo] $smalltaghtml</li>" >> "$tmp"/_major.in.html

	if [ -n "$POST_INTERNAL" ]; then
		redirecthtmlpage "../page/$POST_INTERNAL" > "$outfile" &
	elif [ -n "$POST_EXTERNAL" ]; then
		redirecthtmlpage "$POST_EXTERNAL" > "$outfile" &
	else
		replaceseries() {
			if [[ -n "$series" ]]; then
				replacefile "__SERIES_TOP__" "templates/series_top.in.html" | replacefile "__SERIES_BOTTOM__" "templates/series_bottom.in.html" | replacetext "__SERIES__" "$series" | replacetext "__SERIES_RSS_LINK__" "<link rel='alternate' type='application/rss+xml' title=\"Ben Leskey's RSS feed: $series\" href='tags/$series.feed.xml'>"
			else
				replacetext "__SERIES_TOP__" "" | replacetext "__SERIES_BOTTOM__" "" | replacetext "__SERIES_RSS_LINK__" ""
			fi
		}

		# Build the blog post HTML.
		(replacetext "__TITLE__" "$title" | replacetext "__POST_DATE__" "$dateinfo" | replacetext "__TAGS__" "$taghtml" | replaceseries | commonreplace .. | replacefile "__POST__" "$infile" | python3 toc_builder.py) < templates/post.in.html > "$outfile" &
	fi

	rsspost() {
		if [ -n "$POST_INTERNAL" ]; then
			(if [ -n "$POST_BLURB" ]; then
				echo "<p>$POST_BLURB</p>"
			fi
			echo "See <a href='$POST_INTERNAL'>$POST_INTERNAL</a>") | python3 unrelate.py "https://benleskey.com/page"
		elif [ -n "$POST_EXTERNAL" ]; then
			(if [ -n "$POST_BLURB" ]; then
				echo "<p>$POST_BLURB</p>"
			fi
			echo "See <a href='$POST_EXTERNAL'>$POST_EXTERNAL</a>") | python3 unrelate.py "https://benleskey.com/blog"
		else
			(python3 unrelate.py "https://benleskey.com/blog") < $infile
		fi
	}

	# Build the RSS item XML
	(commonreplace .. | replacetext "__TITLE__" "$(echo "$title" | htmlescape)" | replacetext "__POST_RDATE__" "$(TZ=UTC date --date="$latestdate + 12 hours" -R)" | replacetext "__CATEGORIES__" "$(echo "$tags" | xargs -n1 printf "<category>%s</category>")" | replacetext "__GUID_LINK__" "$post_global_link" | replacetext "__LINK__" "$post_base_link" | replacetext "__DESCRIPTION__" "$(rsspost | htmlescape)") < templates/feed_item.in.xml > "$outfeed" &
}

# Include the list of posts via source, so it can call the post function.
source blog.in/posts.sh

echo "<ul>" > "$tmp"/_pages.in.html

page() {
	name="$1"
	title="$2"
	date="$3"

	echo " $name: $title [$date]"

	infile="page.in/$name.in.html"
	outfile="page/$name.html"

	echo "<li class='postlisting'><a href='$name'>$title</a> [$date]</li>" >> "$tmp"/_pages.in.html

	(replacetext "__TITLE__" "$title" | replacetext "__PAGE_DATE__" "$date" | commonreplace .. | replacefile "__PAGE__" "$infile" | python3 toc_builder.py) < templates/page.in.html > "$outfile" &

	PN=$((PN+1))
}

source page.in/pages.sh

echo "</ul>" >> "$tmp"/_pages.in.html

# If there are more posts than can be displayed in the minor list (on the main page) then add a "More..." link to the minor list.
if [ $BN -gt $BMMAX ]; then
	echo "<li><a href='blog'>$((BN - BMMAX)) more...</a></li>" >> "$tmp"/_minor.in.html
fi

# Cap off the lists.
echo "</ul>" >> "$tmp"/_minor.in.html
echo "</ul>" >> "$tmp"/_major.in.html

(commonreplace .. | replacetext "__NUM_AKAS__" $N_AKAS | replacefile "__AKAS__" "$tmp/_akas.in.html") < templates/aka_index.in.html > "aka/index.html" &

echo " Waiting..."
wait

echo "" > "$tmp"/_feed.in.xml

# Concat all the RSS items
post() {
	name="$1"
	tags="$4"

	if [[ $(grep "<item>" "$tmp"/_feed.in.xml | wc -l) -lt $RSSMAX ]]; then
		feedfile="$tmp/_$name.xml"
		cat < "$feedfile" >> "$tmp"/_feed.in.xml
	fi

	while read tag; do
		touch "$tmp"/_tag_feed_"$tag".xml

		if [[ $(grep "<item>" "$tmp"/_tag_feed_"$tag".xml | wc -l) -lt $RSSMAX ]]; then
			feedfile="$tmp/_$name.xml"
			cat < "$feedfile" >> "$tmp"/_tag_feed_"$tag".xml
		fi
	done < <(echo "$tags" | xargs -n1 --no-run-if-empty)
}

source blog.in/posts.sh

# Build the main page.
(
	replacefile "__BLOGMINOR__" "$tmp/_minor.in.html" |
	commonreplace . |
	python3 element_copy.py |
	python3 alternate.py
) < templates/index.in.html > index.html

# Uniquify and sort the list of all tags.
alltags="$(echo "$alltags" | xargs -n1 | sort | uniq | xargs)"

echo > "$tmp/_tag_list.in.html"

# For each tag, just append the previously generated list of posts HTML for that tag.
while read tag; do
	echo " Tag: $tag"

	echo "<li><a class='icon' href='__ROOT__/blog/tags/$tag.feed.xml' title='RSS feed'><img src='https://upload.wikimedia.org/wikipedia/commons/4/43/Feed-icon.svg' alt='RSS feed'></a><a href='__ROOT__/blog/tags/$tag'>$tag</a></li>" >> "$tmp/_tag_list.in.html"

	(replacefile "__FEED_" "$tmp/_tag_feed_$tag.xml" | replacetext __TAG__ "$tag" | commonreplace ../..) < templates/tag_feed.in.xml > blog/tags/"$tag.feed.xml" &
done < <(echo "$alltags" | xargs -n1 --no-run-if-empty)

while read tag; do
	(replacefile "__ITEMS__" "$tmp/_tag_$tag.html" | replacetext __NUM_POSTS__ "$(wc -l "$tmp/_tag_$tag.html" | cut -d' ' -f1)" | replacefile __TAG_LIST__ "$tmp/_tag_list.in.html" | replacetext __TAG__ "$tag" | commonreplace ../..) < templates/tag.in.html > blog/tags/"$tag".html &
done < <(echo "$alltags" | xargs -n1 --no-run-if-empty)

# Build the dedicated blog index page.
(replacefile "__BLOGMAJOR__" "$tmp/_major.in.html" | replacetext __NUM_POSTS__ "$BN" | replacefile __TAG_LIST__ "$tmp/_tag_list.in.html" | commonreplace ..) < templates/blog.in.html > blog/index.html &

(replacefile "__PAGES__" "$tmp/_pages.in.html" | replacetext __NUM_PAGES__ "$PN" | commonreplace ..) < templates/pages.in.html > page/index.html &

echo " Waiting..."
wait

echo "Generating RSS feed..."
(replacefile "__FEED__" "$tmp/_feed.in.xml" | commonreplace ..) < templates/feed.in.xml > blog/feed.xml &

echo "Processing images..."

mkdir -p thumbs

for ext in jpg png; do
	find images -maxdepth 1 -name "*.$ext" -prune | while read n; do
		n="$(basename "$n")"
		echo " Processing $n"
		convert -resize 10% -strip "images/$n" "thumbs/${n%.*}.10.$ext" &
		convert -resize 25% -strip "images/$n" "thumbs/${n%.*}.25.$ext" &
		convert -resize 50% -strip "images/$n" "thumbs/${n%.*}.50.$ext" &
	done
done

echo " Waiting..."
wait