module Docs class Eigen3 < UrlScraper self.name = 'Eigen3' self.type = 'eigen3' self.slug = 'eigen3' self.base_url = 'https://eigen.tuxfamily.org/dox/' self.root_path = 'index.html' self.initial_paths = [ "modules.html" ] self.release = '3.4.0' self.links = { home: 'https://eigen.tuxfamily.org', code: 'https://gitlab.com/libeigen/eigen' } html_filters.push 'eigen3/entries', 'eigen3/clean_html', 'title' # Remove the `clean_text` because Doxygen are actually creating empty # anchor such as to do anchor link.. and that anchor # will be removed by clean_text self.text_filters = FilterStack.new text_filters.push 'images', 'inner_html', 'attribution' def get_latest_version(opts) tags = get_gitlab_tags("https://gitlab.com", "libeigen", "eigen", opts) tags[0]['name'] end options[:attribution] = <<-HTML © Eigen.
Licensed under the MPL2 License. HTML # Skip source code since it doesn't provide any useful docs options[:skip_patterns] = [/_source/, /-members/, /__Reference\.html/, /_chapter\.html/, /\.txt/, /\.tgz/] # TODO: replace cppreference # options[:replace_urls] = { 'http://en.cppreference.com/w/cpp/' => 'cpp/' } def parse(response) # Hook here because Nokogori removes whitespace from code fragments last_idx = 0 # Process nested

s inside code fragment div. while not (last_idx = response.body.index('

', last_idx)).nil? # enter code fragment

level = 1 while not (last_idx = response.body.index(/<\/?div/, last_idx+1)).nil? # skip nested divs inside. if response.body[last_idx..last_idx+3] == '' response.body[last_idx..last_idx+5] = '' end end response.body.gsub! /[\r\n\s]*

]*>.*<\/div>[\r\n\s]*/, "" response.body.gsub! /

(.*?)<\/div>/m, "\\1" response.body.gsub! '

', '

'
      super
    end

    def process_response?(response)
      return false unless super
      # Remove Empty pages.
      response.body.index(/[\r\n\s]*<\/div>/m).nil? and \
        response.body.index(/TODO: write this dox page!<\/p>/).nil?
    end
  end
end