Parent

Included Modules

Class/Module Index [+]

Quicksearch

Domainatrix::DomainParser

Attributes

public_suffixes[R]

Public Class Methods

new(file_name) click to toggle source
# File lib/domainatrix/domain_parser.rb, line 7
# Builds a parser whose public-suffix table is loaded from +file_name+.
#
# file_name - path passed straight to read_dat_file.
def initialize(file_name)
  # Starts empty; read_dat_file fills it in as a nested Hash keyed by
  # domain label.
  @public_suffixes = {}
  read_dat_file(file_name)
end

Public Instance Methods

parse(url) click to toggle source
# File lib/domainatrix/domain_parser.rb, line 33
# Breaks +url+ into its URL components and its domain components.
#
# url - String handed to URI.parse.
#
# Returns the Hash produced by parse_domains_from_host for the URL's host,
# extended with :scheme, :host, :path (the query string, when present, is
# appended after a "?") and :url (the input, unchanged).
def parse(url)
  uri = URI.parse(url)
  query = uri.query
  # An empty query ("http://x/y?") is still truthy, so the "?" is kept.
  path = query ? "#{uri.path}?#{query}" : uri.path

  url_fields = {
    :scheme => uri.scheme,
    :host   => uri.host,
    :path   => path,
    :url    => url
  }
  parse_domains_from_host(uri.host).merge(url_fields)
end
parse_domains_from_host(host) click to toggle source
# File lib/domainatrix/domain_parser.rb, line 48
# Splits a host name into public suffix, registrable domain and subdomain by
# walking the @public_suffixes tree from the right-most label inwards.
#
# host - String such as "www.example.co.uk". nil is treated like "".
#
# Returns a Hash with String values for :public_suffix, :domain and
# :subdomain. Parts that are absent from the host come back as "".
#
# Robustness notes:
# * A right-most label that is not in the suffix table (e.g. "localhost")
#   is treated as a one-label public suffix instead of raising.
# * A host that consists only of a public suffix (e.g. "com" or "co.uk")
#   yields an empty domain and subdomain instead of raising.
def parse_domains_from_host(host)
  parts = host.to_s.split(".").reverse
  public_suffix = []
  domain = ""
  subdomains = []
  sub_hash = @public_suffixes

  parts.each_with_index do |part, i|
    # Unknown labels have no children in the table; an empty Hash makes
    # them terminate the suffix below.
    sub_hash = sub_hash[part] || {}
    public_suffix << part

    if sub_hash.has_key?("*")
      # Wildcard rule: whatever label follows is part of the suffix too.
      public_suffix << parts[i + 1] if parts[i + 1]
      domain_index = i + 2
    elsif sub_hash.empty? || !sub_hash.has_key?(parts[i + 1])
      # No longer suffix matches, so the next label is the domain.
      domain_index = i + 1
    else
      # The next label extends the suffix; keep descending.
      next
    end

    domain = parts[domain_index].to_s
    # Array#drop returns [] past the end, where slice would return nil.
    subdomains = parts.drop(domain_index + 1)
    break
  end

  {
    :public_suffix => public_suffix.reverse.join("."),
    :domain        => domain,
    :subdomain     => subdomains.reverse.join(".")
  }
end
read_dat_file(file_name) click to toggle source
# File lib/domainatrix/domain_parser.rb, line 12
# Loads public-suffix rules from +file_name+ into @public_suffixes.
#
# Each rule line (e.g. "co.uk") is split on "." and stored right-to-left as
# nested Hashes, so "co.uk" becomes {"uk" => {"co" => {}}}. Blank lines and
# any line containing "//" (the comment marker) are skipped.
#
# file_name - path of the rules file to read.
#
# The file is opened with the block form of File.open so the handle is
# closed even if reading raises.
def read_dat_file(file_name)
  # If we're in 1.9 or later, make sure we're opening it in UTF-8.
  open_args = RUBY_VERSION >= '1.9' ? [file_name, "r:UTF-8"] : [file_name]

  File.open(*open_args) do |dat_file|
    dat_file.each_line do |line|
      line = line.strip
      next if line.empty? || line.include?("//")

      # Descend one level per label, creating missing levels on the way.
      sub_hash = @public_suffixes
      line.split(".").reverse.each do |part|
        sub_hash = (sub_hash[part] ||= {})
      end
    end
  end
end

[Validate]

Generated with the Darkfish Rdoc Generator 2.