# Support for adding tags to daily log posts and miscellaneous fixes to date
# display
require 'fileutils'
require 'nokogiri'
require 'set'
require 'pathname'
require 'uri'
module Jekyll
class ProjectPage < Page
def initialize(site, base, dir)
@site = site
@base = base
@dir = dir
@name = 'index.html'
self.process(@name)
@path = site.layouts["project-home"].path
self.read_yaml("", "") # uses path from above first
self.data['title'] = "Projects"
end
end
class CategoryPageGenerator < Generator
safe true
def generate(site)
if site.layouts.key? 'project-home'
dir = site.config['project-dir'] || 'projects'
site.pages << ProjectPage.new(site, site.source, dir)
end
end
end
end
# Pre-render
#
# This is the first step. When posts are built, this block goes through and
# reads the markdown line by line to identify log entries by looking for headers
# followed by a parseable date. It then extracts the project tags that follow
# the date and constructs a hash/dict mapping log entries by their html ids
# (in the standard YYYYMMDD format) to an array of project tags. This block also
# removes the project tags and pretty formats things.
Jekyll::Hooks.register :posts, :pre_render do |post|
in_code_block = false
entrymap = Hash.new { |h, k| h[k] = Set.new }
converted_lines = post.content.split("\n").map do |line|
# skip code blocks
in_code_block = !in_code_block if line.match(/^```/)
next line if in_code_block
# drop lines that aren't markdown headers
matched = line.match(/^(#+) /)
next line unless matched
# drop headers that don't start with dates
DateTime.parse(line.strip) rescue next line
# pretty format dates
date = DateTime.parse(line.strip)
iddate = date.strftime("%Y%m%d")
displaydate = date.strftime("%a, %b %e")
# extract project tags
tags = line.strip.scan(/#([a-zA-Z0-9._-]{3,} ?)/)
# if project tags are detected for this entry then add it to the hash
if tags.length > 0
tags.each { |tag| entrymap[iddate].add(tag[0].strip) }
end
# replace markdown header with this nice html
"
#{displaydate}
"
end
# sort the hash so posts will be laid out chronologically on the project page
entrymap = Hash[ entrymap.sort_by { |key, val| key } ]
# save the hash for later processing
post.site.data["entrymap"] = entrymap
post.content = converted_lines.join("\n")
end
# Post-render
#
# This is the second step. Once the posts are converted to HTML, this block is
# called. It goes through and splits up each post into separate log entries and
# inserts the HTML version of these log entries into a hash that maps projects
# to entry HTMLs. It also goes and fixes relative links in the log entries so
# that images work once the HTML is copied over to the projects folder.
Jekyll::Hooks.register :posts, :post_render do |post|
# if this post has entries with project tags
if post.site.data["entrymap"].length > 0
# attempt to load a hash mapping tags to ids from the site data
if post.site.data["tagmap"] == nil
tagmap = {}
else
tagmap = post.site.data["tagmap"]
end
# create new array if key doesn't exist (default dictionary)
tagmap.default_proc = proc { |h, k| h[k] = [] }
doc = Nokogiri::HTML post.content
# iterate over each entry and its associated tags
post.site.data["entrymap"].each do |entry, tags|
new_node_set = Nokogiri::XML::NodeSet.new(doc)
orig = doc.at_css("h3.log-entry[id=\"#{entry}\"]")
new_node_set << orig
node = orig.next
# continue until we run out of sibling nodes or we hit the next log entry
while !node.nil? && node["class"] != "log-entry"
new_node_set << node
node = node.next
end
tags.each do |tag|
dir = post.site.config['projects_dir'] || 'projects'
old_path = post.url # convert to relative url since post.url is absolute
old_path[0] = ''
fix_links(new_node_set, old_path, File.join(dir, tag)) # fix rel links
content = new_node_set.to_html
# fix checkboxes
content.gsub! '
[ ]', '
'
content.gsub! '
[x]', '
'
tagmap[tag.strip].push(content)
end
end
post.site.data["tagmap"] = tagmap
end
end
# Post-write
#
# This is the last step. Once the posts are all written, we can build the
# project pages. This works by taking the mapping of projects to HTML fragments
# from previously and generating new pages for each project and injecting the
# HTML fragments into their respective pages.
Jekyll::Hooks.register :site, :post_write do |site|
dir = site.config['projects_dir'] || 'projects'
dest = site.config["destination"]
if site.data.key?("tagmap")
# load in the all generated HTML for the project page, we're going to clone
# this and inject our new content into it to avoid having to deal with liquid
template = File.read(File.join(dest, dir, 'index.html'))
doc = Nokogiri::HTML template
site.data["tagmap"].each_key do |tag|
path = File.join(dest, dir, tag)
FileUtils.mkdir_p path
File.open(File.join(path, "index.html"), 'w') do |f|
# inject new title
doc.at_css('h1.post-title').inner_html = "Project ##{tag} ↩"
# construct one body of HTML from all the separate fragments
new_node_set = Nokogiri::XML::NodeSet.new(doc)
site.data["tagmap"][tag].each do |content|
new_node_set << Nokogiri::HTML::fragment(content)
end
content = doc.at_css('div.post-content')
# skeletonize page and inject new content
content.children.remove rescue nil
content << new_node_set.to_html
content << ""
f.write(doc.to_html)
end
end
end
end
# fixes relative paths for the new tag files
def fix_links(doc, old_path, new_path)
# figure out relative link mapping
prefix = Pathname.new(old_path).relative_path_from(Pathname.new(new_path))
url_tags = {
'img' => 'src',
'script' => 'src',
'a' => 'href'
}
# grab all url links
doc.search(url_tags.keys.join(',')).each do |node|
url_param = url_tags[node.name]
src = node[url_param]
unless src.empty?
path = Pathname.new(src)
uri = URI.parse(src)
# only fix relative links and non http calls
if path.relative? && !%w( http https ).include?(uri.scheme)
node[url_param] = (prefix+path).to_s
end
end
end
end