aboutsummaryrefslogblamecommitdiff
path: root/_plugins/linter.rb
blob: aa568bbd06e121015197798b3c63f00f4697ed14 (plain) (tree)
1
2
3
4
5
6
7
8
9
10

             

                                                 



                          

                  



                                   
                                    

                                           
                         



                               
                        

                                                        


         
























                                                                
                           


                            

                             

     
                                                 











































                                                                                                             


                                   


                                                           
           



                                

                                                           


         
                        





                                                                









                                                               
           


         

                           
                             

     





                                                             

                                                              
                                 
                                                                              







                                                                                               
                                               






                                                                                                                                                         
                                                                                                    

                                     

                                                                                                                                                           

                                            







                                                                                                                                                 





               

                             
                              
                                 
                            
       

















                                                 

     
require 'set'

# Paths of pages that are never handed to the lint checks.
IGNORED_PAGES = Set['sitemap.xml'].freeze
# Values accepted for the `lang` front matter field.
LANGS = Set['en', 'pt', 'fr', 'eo'].freeze # jp zh es de

module Jekyll
  class Linter < Generator
    safe true
    priority :high

    # Records the "<name>:<lang>:<ref>" identifier of +document+ in
    # @known_ids.
    #
    # Raises RuntimeError when the same identifier was recorded before.
    def insert_id(name, document)
      data = document.data
      id = "#{name}:#{data['lang']}:#{data['ref']}"
      raise "Duplicate ID found: '#{id}'" if @known_ids.include?(id)

      @known_ids.add(id)
    end

    # Starts from an empty @known_ids set and registers every document
    # yielded by all_documents, so a repeated collection/lang/ref
    # combination raises from insert_id.
    def assert_unique_ids(site)
      @known_ids = Set.new
      all_documents(site) { |name, doc| insert_id(name, doc) }
    end

    # Builds a slug from +s+: every run of non-word characters becomes a
    # single separator, leading and trailing separators are dropped, the
    # text is lowercased, and both separators and underscores end up as '-'.
    def slugify(s)
      words = s.gsub(/\W+/, ' ').strip
      words.downcase.tr(' _', '-')
    end

    # Returns +value+ when it is truthy; raises +message+ when it is nil or
    # false.
    def assert(value, message)
      value || raise(message)
    end

    # Returns the front matter value stored under +field+ in +document+.
    #
    # Raises RuntimeError naming the field and the document path when the
    # value is nil or false.
    def assert_field(document, field)
      value = document.data[field]
      return value if value

      raise "Undefined '#{field}' for #{document.path}"
    end

    # Layout every document must declare, keyed by the name of the
    # collection it belongs to. 'page' is the name all_documents uses for
    # the site's standalone pages.
    COLLECTION_LAYOUTS = {
      'page' => 'page',
      'slides' => 'slides',
      'articles' => 'post',
      'pastebins' => 'post',
      'tils' => 'post',
      'podcasts' => 'post',
      'screencasts' => 'post'
    }.freeze

    # Validates the front matter of +document+, which belongs to the
    # collection +name+ ('page' for standalone pages).
    #
    # Checks, in this order:
    # * 'title', 'lang', 'ref' and 'layout' are set ('slug' too, unless the
    #   layout is 'page');
    # * 'lang' is a member of LANGS;
    # * 'layout' is the one COLLECTION_LAYOUTS lists for +name+;
    # * for English documents, 'ref' is the slug of the title, except for
    #   the refs 'index', 'root' and 'tils';
    # * for non-page documents, the relative path is
    #   "_<name>/<date>-<slug>.<ext>" and, in English, 'ref' equals 'slug';
    # * podcasts and screencasts have their media file under resources/
    #   (resolved against the current working directory).
    #
    # Raises RuntimeError describing the first violation found; returns nil
    # when the document passes.
    def assert_frontmatter_fields(name, document)
      title = assert_field document, 'title'
      lang = assert_field document, 'lang'
      ref = assert_field document, 'ref'
      layout = assert_field document, 'layout'
      is_page = layout == 'page'
      slug = is_page ? ref : assert_field(document, 'slug')

      raise "Invalid lang '#{lang}' in #{document.path}" unless LANGS.member? lang

      expected_layout = COLLECTION_LAYOUTS[name]
      if expected_layout != layout
        raise "Layout mismatch: expected '#{expected_layout}', got '#{layout}' for #{document.path}"
      end

      if lang == 'en' && !%w[index root tils].include?(ref)
        title_slug = slugify(title)
        if title_slug != ref
          raise "#{ref} isn't a slug of the title.\nref:        '#{ref}'\ntitle slug: '#{title_slug}'"
        end
      end

      # Only the 'page' entry of COLLECTION_LAYOUTS maps to the 'page'
      # layout, so once the layout check passed a page can be neither a
      # podcast nor a screencast: nothing below applies to it.
      return if is_page

      # The date is read only now, after the layout was validated, so a
      # document with an unexpected layout is reported as a layout mismatch
      # instead of failing while its date is being formatted.
      date = document.date.strftime('%Y-%m-%d')
      extension = name == 'slides' ? 'slides' : 'md'
      path = "_#{name}/#{date}-#{slug}.#{extension}"
      unless path == document.relative_path
        raise "date/filename mismatch:\ndate+slug: #{path}\nfilename:  #{document.relative_path}"
      end

      raise "ref/slug mismatch:\nref:  #{ref}\nslug: #{slug}" if lang == 'en' && ref != slug

      case name
      when 'podcasts'
        flac = "resources/podcasts/#{date}-#{slug}.flac"
        raise "Missing FLAC file '#{flac}'" unless File.exist? flac
      when 'screencasts'
        webm = "resources/screencasts/#{date}-#{slug}.webm"
        raise "Missing WebM file '#{webm}'" unless File.exist? webm
      end
    end

    # Runs assert_frontmatter_fields on every document that all_documents
    # yields for +site+.
    def assert_frontmatter(site)
      all_documents(site) { |name, doc| assert_frontmatter_fields(name, doc) }
    end

    # True until assert_git_annex has reported unpublished files once.
    @@first_build = true

    # Asks `git annex` for files that are not in the "web" remote.
    #
    # When the command prints anything or exits unsuccessfully, the list is
    # printed together with one `git annex addurl` command per file, built
    # from the site's configured 'url'. The first time this happens only a
    # notice is printed; every later time the notice is raised as a
    # RuntimeError.
    def assert_git_annex(site)
      base_url = site.config['url']
      unpublished = `git annex find --not --in web`
      return if unpublished == '' && $?.success?

      puts 'Files in Git Annex not published to "web" remote:'
      puts unpublished
      puts "Add them with:\n\n"
      unpublished.strip.split("\n").each do |path|
        puts "git annex addurl --file #{path} #{base_url}/#{path}"
      end

      notice = "\nBuild again after files above are added"
      raise notice unless @@first_build

      @@first_build = false
      puts notice
    end

    # Extension of the media file that accompanies each document of a media
    # collection, keyed by collection name.
    MEDIA_EXTENSION = {
      'podcasts' => 'flac',
      'screencasts' => 'webm'
    }.freeze

    # Checks the metadata embedded in the media file of every podcast and
    # screencast document of +site+.
    #
    # The media file is looked up at
    # "resources/<collection>/<date>-<slug>.<ext>", relative to the current
    # working directory. `metaflac` and `mediainfo` are started directly,
    # without a shell, so a path containing spaces or quotes reaches them
    # unchanged.
    #
    # Raises RuntimeError on the first mismatch; the message contains the
    # commands that fix and re-check the file.
    def assert_media_metadata(site)
      site.collections.each do |name, collection|
        ext = MEDIA_EXTENSION[name]
        next unless ext

        collection.docs.each do |document|
          date = document.data['date'].strftime('%Y-%m-%d')
          file = "resources/#{name}/#{date}-#{document.data['slug']}.#{ext}"
          if name == 'podcasts'
            assert_podcast_metadata site, document, file, date
          elsif name == 'screencasts'
            assert_screencast_metadata document, file
          end
        end
      end
    end

    # Raises unless the FLAC +file+ carries every expected tag and its
    # embedded picture is byte-identical to static/favicon.png.
    def assert_podcast_metadata(site, document, file, date)
      actual = IO.popen(['metaflac', '--export-tags-to=-', file], &:read).strip.split("\n")
      expected = [
        "COMMENTS=#{site.config['url']}/#{file}",
        'ARTIST=EuAndreh',
        "DATE=#{date}",
        "TITLE=#{document.data['title']}",
        "ALBUM=#{site.config['t']['podcasts']['feed']['title'][document.data['lang']]}"
      ]
      missing = expected.find { |entry| !actual.include?(entry) }
      if missing
        # The tags are embedded in a single-quoted printf argument, hence
        # the literal "\n" separators and the '"'"' quote escaping.
        tags = expected.join('\\n').gsub(/'/, "'\"'\"'")
        add_metadata_cmd = "metaflac --remove-all #{file}\nprintf '#{tags}\\n' | metaflac --import-tags-from=- #{file}"
        check_metadata_cmd = "metaflac --export-tags-to=- #{file}"
        raise "Missing metadata entry '#{missing}' in '#{file}'.\nAdd it with:\n\n#{add_metadata_cmd}\n\nCheck with:\n  #{check_metadata_cmd}"
      end

      # Compare the picture bytes in Ruby rather than piping through `diff`.
      cover = 'static/favicon.png'
      picture = IO.popen(['metaflac', file, '--export-picture-to=-'], 'rb', &:read)
      return if File.file?(cover) && picture == File.binread(cover)

      check_cover_cmd = "metaflac #{file} --export-picture-to=- | diff - static/favicon.png"
      add_cover_cmd = "metaflac #{file} --import-picture-from=static/favicon.png"
      raise "Cover art from '#{file}' doesn't match 'static/favicon.png'.\nFix it with:\n\n#{add_cover_cmd}\n\nCheck with:\n  #{check_cover_cmd}"
    end

    # Raises unless the "Movie name" reported by mediainfo for +file+ is
    # "<title> - EuAndreh".
    def assert_screencast_metadata(document, file)
      report = IO.popen(['mediainfo', file], &:read)
      name_line = report.each_line.find { |line| line.start_with?('Movie name') }
      # Keep everything after the first ':' so that a title which itself
      # contains a colon is compared in full.
      actual = name_line.to_s.split(':', 2)[1].to_s.strip
      expected = "#{document.data['title']} - EuAndreh"
      return if actual == expected

      escaped_title = expected.gsub(/'/, "'\"'\"'")
      add_metadata_cmd = "mkvpropedit '#{file}' -e info -s title='#{escaped_title}'"
      check_metadata_cmd = "mediainfo '#{file}' | grep 'Movie name'"
      raise "Missing metadata entry 'title' in '#{file}'.\nAdd it with:\n\n#{add_metadata_cmd}\n\nCheck with:\n  #{check_metadata_cmd}"
    end

    private :assert_podcast_metadata, :assert_screencast_metadata

    # Runs every lint check against +site+, in this order: unique IDs,
    # front matter, media metadata, Git Annex publication. Each check
    # raises on failure, so later checks only run when earlier ones passed.
    def generate(site)
      assert_unique_ids site
      assert_frontmatter site
      assert_media_metadata site
      assert_git_annex site
    end

    # Yields (collection name, document) for every collection document of
    # +site+, then ('page', page) for every page whose path is not listed
    # in IGNORED_PAGES. Entries whose front matter has a truthy 'generated'
    # value are skipped in both passes.
    def all_documents(site)
      site.collections.each do |name, collection|
        collection.docs.each do |document|
          next if document.data['generated']

          yield name, document
        end
      end

      site.pages.each do |page|
        next if IGNORED_PAGES.include?(page.path) || page.data['generated']

        yield 'page', page
      end
    end
  end
end