require 'set'
# Page paths that are skipped when walking site.pages in all_documents.
# Frozen so the lint rules cannot be altered by accident at runtime.
IGNORED_PAGES = Set['sitemap.xml'].freeze
# Language codes accepted in a document's 'lang' front-matter field.
# NOTE(review): the original trailing note listed "jp zh es de" -- presumably
# languages planned but not enabled yet; confirm before adding any of them.
LANGS = Set['en', 'pt', 'fr', 'eo'].freeze
module Jekyll
class Linter < Generator
safe true
priority :high
# Records the "<name>:<lang>:<ref>" identifier of a document in @known_ids.
#
# @param name [String] collection name the document was yielded under
# @param document [#data] object whose data hash provides 'lang' and 'ref'
# @return [Set] @known_ids after the identifier has been added
# @raise [RuntimeError] when the same identifier was already recorded
def insert_id(name, document)
  key = "#{name}:#{document.data['lang']}:#{document.data['ref']}"
  raise "Duplicate ID found: '#{key}'" if @known_ids.include?(key)

  @known_ids.add(key)
end
# Resets @known_ids and registers every document yielded by all_documents,
# so that insert_id raises on the first repeated identifier.
#
# @param site [Object] passed through unchanged to all_documents
def assert_unique_ids(site)
  @known_ids = Set.new
  all_documents(site) { |collection_name, document| insert_id(collection_name, document) }
end
# Converts a title into a lowercase, hyphen-separated slug.
#
# Each run of non-word characters (Ruby's \W) becomes one separator, leading
# and trailing separators are dropped, and underscores are turned into
# hyphens as well (so consecutive underscores yield consecutive hyphens).
#
# @param s [String] text to slugify
# @return [String] the slug; empty when s contains no word characters
def slugify(s)
  # A single \W+ pass already collapses every whitespace run to one space,
  # so no padding or separate whitespace squeeze is needed before stripping.
  s.gsub(/\W+/, ' ')
   .strip
   .downcase
   .tr(' _', '-')
end
# Returns value when it is truthy; otherwise raises with the given message.
#
# @param value [Object] value to check (only nil and false fail)
# @param message [String] argument handed to raise on failure
# @return [Object] value itself
def assert(value, message)
  return value if value

  raise message
end
# Fetches a front-matter field, failing when it is missing (nil or false).
#
# @param document [#data, #path] object whose data hash is inspected
# @param field [String] key to look up in document.data
# @return [Object] the stored value
# @raise [RuntimeError] naming the field and document.path when it is absent
def assert_field(document, field)
  document.data[field] || raise("Undefined '#{field}' for #{document.path}")
end
# Layout each document must declare, keyed by the name it is yielded under
# (a collection name, or 'page' for standalone pages). Names missing from
# this table map to nil and therefore never match a declared layout.
COLLECTION_LAYOUTS = {
  'page' => 'page',
  'slides' => 'slides',
  'articles' => 'post',
  'pastebins' => 'post',
  'tils' => 'post',
  'podcasts' => 'post',
  'screencasts' => 'post'
}.freeze
# Validates the front matter of one document against the site conventions.
#
# Checks, in order: required fields, allowed language, layout expected for
# the collection, English ref == slugified title, file name == date + slug,
# English ref == slug, and presence of the media file for podcasts and
# screencasts.
#
# @param name [String] collection name, or 'page' for standalone pages
# @param document [#data, #path, #relative_path] document to check; it must
#   also respond to #date unless its layout is 'page'
# @return [nil]
# @raise [RuntimeError] describing the first rule that is violated
def assert_frontmatter_fields(name, document)
  title = assert_field(document, 'title')
  lang = assert_field(document, 'lang')
  ref = assert_field(document, 'ref')
  layout = assert_field(document, 'layout')

  # Validate lang and layout before touching date/slug: a page that declares
  # the wrong layout must get the layout message, not a failure caused by
  # reading fields that only non-page documents have.
  raise "Invalid lang '#{lang}' in #{document.path}" unless LANGS.member?(lang)

  expected_layout = COLLECTION_LAYOUTS[name]
  if expected_layout != layout
    raise "Layout mismatch: expected '#{expected_layout}', got '#{layout}' for #{document.path}"
  end

  is_page = layout == 'page'
  date = document.date.strftime('%Y-%m-%d') unless is_page
  slug = is_page ? ref : assert_field(document, 'slug')
  extension = name == 'slides' ? 'slides' : 'md'

  # English documents define the canonical ref, which must be derived from
  # the title; a few fixed refs are exempt.
  if lang == 'en' && !%w[index root tils].include?(ref)
    title_slug = slugify(title)
    if title_slug != ref
      raise "#{ref} isn't a slug of the title.\nref: '#{ref}'\ntitle slug: '#{title_slug}'"
    end
  end

  unless is_page
    path = "_#{name}/#{date}-#{slug}.#{extension}"
    unless path == document.relative_path
      raise "date/filename mismatch:\ndate+slug: #{path}\nfilename: #{document.relative_path}"
    end
    raise "ref/slug mismatch:\nref: #{ref}\nslug: #{slug}" if lang == 'en' && ref != slug
  end

  if name == 'podcasts'
    flac = "resources/podcasts/#{date}-#{slug}.flac"
    raise "Missing FLAC file '#{flac}'" unless File.exist?(flac)
  end

  if name == 'screencasts'
    webm = "resources/screencasts/#{date}-#{slug}.webm"
    raise "Missing WebM file '#{webm}'" unless File.exist?(webm)
  end
end
# Runs assert_frontmatter_fields on every document yielded by all_documents.
#
# @param site [Object] passed through unchanged to all_documents
def assert_frontmatter(site)
  all_documents(site) { |collection_name, document| assert_frontmatter_fields(collection_name, document) }
end
# True until assert_git_annex has reported unpublished files once: the first
# report is only printed, every later one raises.
@@first_build = true

# Checks that `git annex find --not --in web` lists nothing and succeeds.
#
# Otherwise prints the listed files together with a suggested
# `git annex addurl` command per file (built from site.config['url']).
#
# @param site [#config] source of the 'url' setting used in the suggestions
# @return [nil]
# @raise [RuntimeError] when the check fails again after a first warning
def assert_git_annex(site)
  base_url = site.config['url']
  unpublished = `git annex find --not --in web`
  return if unpublished == '' && $?.success?

  puts 'Files in Git Annex not published to "web" remote:'
  puts unpublished
  puts "Add them with:\n\n"
  unpublished.strip.split("\n").each do |file|
    puts "git annex addurl --file #{file} #{base_url}/#{file}"
  end

  notice = "\nBuild again after files above are added"
  raise notice unless @@first_build

  @@first_build = false
  puts notice
end
# File extension of the media file under resources/<collection>/ that
# accompanies each document of the given collection.
MEDIA_EXTENSION = {
  'podcasts' => 'flac',
  'screencasts' => 'webm'
}.freeze
# Verifies the metadata embedded in the media file of every podcast and
# screencast document. Other collections are ignored.
#
# @param site [#collections, #config] collections are iterated as
#   name => collection (responding to #docs); config supplies 'url' and the
#   translated podcast feed titles
# @return [Object] whatever site.collections.each returns
# @raise [RuntimeError] with fix-up commands for the first mismatch found
def assert_media_metadata(site)
  site.collections.each do |name, collection|
    next unless %w[podcasts screencasts].include?(name)

    collection.docs.each do |document|
      date = document.data['date'].strftime('%Y-%m-%d')
      file = "resources/#{name}/#{date}-#{document.data['slug']}.#{MEDIA_EXTENSION[name]}"
      case name
      when 'podcasts' then assert_podcast_metadata(site, document, file, date)
      when 'screencasts' then assert_screencast_metadata(document, file)
      end
    end
  end
end

# Checks the Vorbis comments and the cover picture of one podcast FLAC file.
private def assert_podcast_metadata(site, document, file, date)
  actual_tags = `metaflac --export-tags-to=- #{file}`.strip.split("\n")
  expected = [
    "COMMENTS=#{site.config['url']}/#{file}",
    'ARTIST=EuAndreh',
    "DATE=#{date}",
    "TITLE=#{document.data['title']}",
    "ALBUM=#{site.config['t']['podcasts']['feed']['title'][document.data['lang']]}"
  ]
  missing = expected.find { |tag| !actual_tags.include?(tag) }
  if missing
    # Literal backslash-n separators (for printf) and shell-escaped quotes.
    tags = expected.join('\\n').gsub(/'/, "'\"'\"'")
    add_metadata_cmd = "metaflac --remove-all #{file}\nprintf '#{tags}\\n' | metaflac --import-tags-from=- #{file}"
    check_metadata_cmd = "metaflac --export-tags-to=- #{file}"
    raise "Missing metadata entry '#{missing}' in '#{file}'.\nAdd it with:\n\n#{add_metadata_cmd}\n\nCheck with:\n #{check_metadata_cmd}"
  end

  check_cover_cmd = "metaflac #{file} --export-picture-to=- | diff - static/favicon.png"
  `#{check_cover_cmd}`
  return if $?.success?

  add_cover_cmd = "metaflac #{file} --import-picture-from=static/favicon.png"
  raise "Cover art from '#{file}' doesn't match 'static/favicon.png'.\nFix it with:\n\n#{add_cover_cmd}\n\nCheck with:\n #{check_cover_cmd}"
end

# Checks the "Movie name" reported by mediainfo for one screencast file.
private def assert_screencast_metadata(document, file)
  # Strip only the label up to the FIRST colon; splitting the line on every
  # colon would cut off titles that themselves contain one.
  actual = `mediainfo #{file} | awk '/^Movie name/ { sub(/^[^:]*:/, ""); print }'`.strip
  expected = document.data['title'] + ' - EuAndreh'
  return if actual == expected

  escaped_title = expected.gsub(/'/, "'\"'\"'")
  add_metadata_cmd = "mkvpropedit '#{file}' -e info -s title='#{escaped_title}'"
  check_metadata_cmd = "mediainfo '#{file}' | grep 'Movie name'"
  raise "Missing metadata entry 'title' in '#{file}'.\nAdd it with:\n\n#{add_metadata_cmd}\n\nCheck with:\n #{check_metadata_cmd}"
end
# Generator entry point: runs every lint check against the site, in order.
# The first failing check raises, so later checks do not run.
#
# @param site [Object] handed unchanged to each check
# @return [Object] the result of the last check (assert_git_annex)
def generate(site)
  checks = %i[assert_unique_ids assert_frontmatter assert_media_metadata assert_git_annex]
  checks.map { |check| send(check, site) }.last
end
# Yields every hand-written document of the site as (name, document).
#
# Collection documents are yielded with their collection name, standalone
# pages with the name 'page'. Entries whose data has a truthy 'generated'
# value are skipped, as are pages whose path is listed in IGNORED_PAGES.
#
# @param site [#collections, #pages] site to walk
# @yieldparam name [String] collection name or 'page'
# @yieldparam document [Object] the document or page
def all_documents(site)
  site.collections.each do |name, collection|
    collection.docs.each do |document|
      next if document.data['generated']

      yield name, document
    end
  end

  site.pages.each do |page|
    next if IGNORED_PAGES.include?(page.path) || page.data['generated']

    yield 'page', page
  end
end
end
end