RubyGems - domainatrix - Versions diffs - 0.0.1 - Mend

domainatrix 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

data/README.textile +63 -0
data/lib/domainatrix.rb +13 -0
data/lib/domainatrix/domain_parser.rb +63 -0
data/lib/domainatrix/url.rb +24 -0
data/lib/effective_tld_names.dat +4362 -0
data/spec/domainatrix/domain_parser_spec.rb +63 -0
data/spec/domainatrix/url_spec.rb +37 -0
data/spec/domainatrix_spec.rb +16 -0
data/spec/spec.opts +2 -0
data/spec/spec_helper.rb +10 -0
metadata +64 -0

data/spec/domainatrix/domain_parser_spec.rb ADDED

@@ -0,0 +1,63 @@
+require File.dirname(__FILE__) + '/../spec_helper'
+describe "domain parser" do
+  before(:all) do
+    @domain_parser = Domainatrix::DomainParser.new("#{File.dirname(__FILE__)}/../../lib/effective_tld_names.dat")
+  end
+  describe "reading the dat file" do
+    it "creates a tree of the domain names" do
+      @domain_parser.tlds.should be_a Hash
+    end
+    it "creates the first level of the tree" do
+      @domain_parser.tlds.should have_key("com")
+    end
+    it "creates the first level of the tree even when the first doesn't appear on a line by itself" do
+      @domain_parser.tlds.should have_key("uk")
+    end
+    it "creates lower levels of the tree" do
+      @domain_parser.tlds["jp"].should have_key("ac")
+      @domain_parser.tlds["jp"]["aichi"].should have_key("*")
+    end
+  end
+  describe "parsing" do
+    it "returns a hash of parts" do
+      @domain_parser.parse("http://pauldix.net").should be_a Hash
+    end
+    it "should strip the http://" do
+      @domain_parser.parse("http://pauldix.net").values.each {|val| (val =~ /http\:\/\//).should_not be}
+    end
+    it "parses out the path" do
+      @domain_parser.parse("http://pauldix.net/foo.html?asdf=foo")[:path].should == "/foo.html?asdf=foo"
+      @domain_parser.parse("http://pauldix.net?asdf=foo")[:path].should == "?asdf=foo"
+      @domain_parser.parse("http://pauldix.net")[:path].should == ""
+    end
+    it "parses the tld" do
+      @domain_parser.parse("http://pauldix.net")[:tld].should == "net"
+      @domain_parser.parse("http://pauldix.co.uk")[:tld].should == "co.uk"
+      @domain_parser.parse("http://pauldix.com.kg")[:tld].should == "com.kg"
+      @domain_parser.parse("http://pauldix.com.aichi.jp")[:tld].should == "com.aichi.jp"
+    end
+    it "should have the domain" do
+      @domain_parser.parse("http://pauldix.net")[:domain].should == "pauldix"
+      @domain_parser.parse("http://foo.pauldix.net")[:domain].should == "pauldix"
+      @domain_parser.parse("http://pauldix.co.uk")[:domain].should == "pauldix"
+      @domain_parser.parse("http://foo.pauldix.co.uk")[:domain].should == "pauldix"
+      @domain_parser.parse("http://pauldix.com.kg")[:domain].should == "pauldix"
+      @domain_parser.parse("http://pauldix.com.aichi.jp")[:domain].should == "pauldix"
+    end
+    it "should have subdomains" do
+      @domain_parser.parse("http://foo.pauldix.net")[:subdomain].should == "foo"
+      @domain_parser.parse("http://bar.foo.pauldix.co.uk")[:subdomain].should == "bar.foo"
+    end
+  end
+end

data/spec/domainatrix/url_spec.rb ADDED

@@ -0,0 +1,37 @@
+require File.dirname(__FILE__) + '/../spec_helper'
+describe "url" do
+  it "has the tld" do
+    Domainatrix::Url.new(:tld => "net").tld.should == "net"
+  end
+  it "has the domain" do
+    Domainatrix::Url.new(:domain => "pauldix").domain.should == "pauldix"
+  end
+  it "has the subdomain" do
+    Domainatrix::Url.new(:subdomain => "foo").subdomain.should == "foo"
+  end
+  it "has the path" do
+    Domainatrix::Url.new(:path => "/asdf.html").path.should == "/asdf.html"
+  end
+  it "canonicalizes the url" do
+    Domainatrix::Url.new(:domain => "pauldix", :tld => "net").canonical.should == "net.pauldix"
+    Domainatrix::Url.new(:subdomain => "foo", :domain => "pauldix", :tld => "net").canonical.should == "net.pauldix.foo"
+    Domainatrix::Url.new(:subdomain => "foo.bar", :domain => "pauldix", :tld => "net").canonical.should == "net.pauldix.bar.foo"
+    Domainatrix::Url.new(:domain => "pauldix", :tld => "co.uk").canonical.should == "uk.co.pauldix"
+    Domainatrix::Url.new(:subdomain => "foo", :domain => "pauldix", :tld => "co.uk").canonical.should == "uk.co.pauldix.foo"
+    Domainatrix::Url.new(:subdomain => "foo.bar", :domain => "pauldix", :tld => "co.uk").canonical.should == "uk.co.pauldix.bar.foo"
+    Domainatrix::Url.new(:subdomain => "", :domain => "pauldix", :tld => "co.uk").canonical.should == "uk.co.pauldix"
+  end
+  it "canonicalizes the url with the path" do
+    Domainatrix::Url.new(:subdomain => "foo", :domain => "pauldix", :tld => "net", :path => "/hello").canonical.should == "net.pauldix.foo/hello"
+  end
+  it "canonicalizes the url without the path" do
+    Domainatrix::Url.new(:subdomain => "foo", :domain => "pauldix", :tld => "net").canonical(:include_path => false).should == "net.pauldix.foo"
+  end
+end

data/spec/domainatrix_spec.rb ADDED

@@ -0,0 +1,16 @@
+require File.dirname(__FILE__) + '/spec_helper'
+describe "domainatrix" do
+  it "should parse into a url object" do
+    Domainatrix.parse("http://pauldix.net").should be_a Domainatrix::Url
+  end
+  it "should canonicalize" do
+    Domainatrix.parse("http://pauldix.net").canonical.should == "net.pauldix"
+    Domainatrix.parse("http://pauldix.net/foo.html").canonical.should == "net.pauldix/foo.html"
+    Domainatrix.parse("http://pauldix.net/foo.html?asdf=bar").canonical.should == "net.pauldix/foo.html?asdf=bar"
+    Domainatrix.parse("http://foo.pauldix.net").canonical.should == "net.pauldix.foo"
+    Domainatrix.parse("http://foo.bar.pauldix.net").canonical.should == "net.pauldix.bar.foo"
+    Domainatrix.parse("http://pauldix.co.uk").canonical.should == "uk.co.pauldix"
+  end
+end

data/spec/spec.opts ADDED

@@ -0,0 +1,2 @@
+ --diff
+ --color

data/spec/spec_helper.rb ADDED

@@ -0,0 +1,10 @@
+require "rubygems"
+require "spec"
+# gem install redgreen for colored test output
+begin require "redgreen" unless ENV['TM_CURRENT_LINE']; rescue LoadError; end
+path = File.expand_path(File.dirname(__FILE__) + "/../lib/")
+$LOAD_PATH.unshift(path) unless $LOAD_PATH.include?(path)
+require "lib/domainatrix"

metadata ADDED

@@ -0,0 +1,64 @@
+--- !ruby/object:Gem::Specification
+name: domainatrix
+version: !ruby/object:Gem::Version
+  version: 0.0.1
+platform: ruby
+authors:
+- Paul Dix
+autorequire:
+bindir: bin
+cert_chain: []
+date: 2009-12-10 00:00:00 -05:00
+default_executable:
+dependencies: []
+description:
+email: paul@pauldix.net
+executables: []
+extensions: []
+extra_rdoc_files: []
+files:
+- lib/domainatrix.rb
+- lib/effective_tld_names.dat
+- lib/domainatrix/domain_parser.rb
+- lib/domainatrix/url.rb
+- README.textile
+- spec/spec.opts
+- spec/spec_helper.rb
+- spec/domainatrix_spec.rb
+- spec/domainatrix/domain_parser_spec.rb
+- spec/domainatrix/url_spec.rb
+has_rdoc: true
+homepage: http://github.com/pauldix/domainatrix
+licenses: []
+post_install_message:
+rdoc_options: []
+require_paths:
+- lib
+required_ruby_version: !ruby/object:Gem::Requirement
+  requirements:
+  - - ">="
+    - !ruby/object:Gem::Version
+      version: "0"
+  version:
+required_rubygems_version: !ruby/object:Gem::Requirement
+  requirements:
+  - - ">="
+    - !ruby/object:Gem::Version
+      version: "0"
+  version:
+requirements: []
+rubyforge_project:
+rubygems_version: 1.3.5
+signing_key:
+specification_version: 2
+summary: A cruel misstress that uses the public suffix domain list to dominate URLs by canonicalizing, finding TLDs, and breaking them into their domain parts.
+test_files: []