rjl-allmusic 0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (3) hide show
  1. checksums.yaml +7 -0
  2. data/lib/allmusic.rb +129 -0
  3. metadata +44 -0
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: b155dfb8ba731eb2b83141639618bc488cf4bf69
4
+ data.tar.gz: a150392aa792c92b30be443bb676a0edaab3be52
5
+ SHA512:
6
+ metadata.gz: 4b3ce309787ceda0bcc62d004e26b5e5e4de19b681d3954c90a5734263f9eb8716d6547255c4852322efd60158efff8b447e6b37bc2a9e40923ed03ee44bff86
7
+ data.tar.gz: 065de01a7543af3c01a1f1dba95f3793d6281f3186c80d8bd82eba4cde83255c9f39127d46f9b49854a7c66cbff2d1ab003ea063c82d1afd7dbb462e3483e4f9
data/lib/allmusic.rb ADDED
@@ -0,0 +1,129 @@
1
+ require 'nokogiri'
2
+ require 'uri'
3
+ require 'open-uri'
4
+ require 'fuzzystringmatch' #https://github.com/kiyoka/fuzzy-string-match
5
+
6
+ # Allmusic.com client
7
+ # @param [String]
8
+ class Allmusic
9
+
10
+ # @!attribute album
11
+ # @return [String] Album name
12
+ attr_accessor :album
13
+ # @!attribute artist
14
+ # @return [String] Artist name
15
+ attr_accessor :artist
16
+ attr_reader :genres
17
+ attr_reader :styles
18
+ attr_reader :genre
19
+ attr_reader :style
20
+
21
+ ARTIST_SEARCH_URL = "http://www.allmusic.com/search/artists/"
22
+
23
+ def initialize( artist = nil, album = nil)
24
+ @artist = artist
25
+ @album = album
26
+ @genre = nil
27
+ @style = nil
28
+ end
29
+
30
+ # return a list of the albums genre/styles
31
+ # @param album_page [Nokogiri] the page node to parse
32
+ # @param type [String] 'genre' | 'styles'
33
+ # @return [string] list of genre / syles
34
+ def parse( album_page, type = 'genre' )
35
+ data = []
36
+ data_nodes = album_page.xpath("//div[@class='#{type}']//a")
37
+ data_nodes.each do |data_node|
38
+ data << data_node.text
39
+ end
40
+ return data
41
+ end
42
+
43
+ # Sets @genre and @style for @album, @artist
44
+ def get_meta
45
+
46
+ # search for artist page e.g. http://www.allmusic.com/search/artists/abba
47
+ artist_search_url = make_url(ARTIST_SEARCH_URL, @artist)
48
+ artist_search_page = Nokogiri::HTML(open(artist_search_url))
49
+
50
+ if no_search_result?(artist_search_page)
51
+ raise "Couldn't find artist '#{@artist}'"
52
+ exit
53
+ end
54
+
55
+ # get the url of the artist page
56
+ artist_urls = artist_search_page.xpath("//ul[@class='search-results']//div[@class='name']/a")
57
+ artist_url = best_match(@artist, artist_urls)
58
+
59
+ # get the artist discography page
60
+ album_search_page = make_url(artist_url, '/discography/all')
61
+ artist_discography_page = Nokogiri::HTML(open(album_search_page))
62
+
63
+ # get album link
64
+ album_urls = artist_discography_page.xpath("//td[@class='title']/a[1]")
65
+ album_url = best_match(@album, album_urls)
66
+
67
+ unless album_url.nil?
68
+ # get album page
69
+ begin
70
+ album_page = Nokogiri::HTML(open(album_url))
71
+ @genres = parse( album_page, 'genre' )
72
+ @styles = parse( album_page, 'styles')
73
+ # # get genre
74
+ # # TODO: Improve this is there are more than one
75
+ # @genre = album_page.xpath("//div[@class='genre']//a[1]").text
76
+ # # get style
77
+ # @style = album_page.xpath("//div[@class='styles']//a[1]").text
78
+ rescue
79
+ puts ">> ERROR: Couldn't open #{album_url} for #{@artist} / #{@album}"
80
+ end
81
+ end
82
+ end
83
+
84
+ def genre
85
+ return @genres[0]
86
+ end
87
+
88
+ def style
89
+ return @styles[0]
90
+ end
91
+
92
+ # @return [URL] Joins URL parts
93
+ def make_url( root, path)
94
+ # TODO: unsafe, not portable - File.join gives the wrong separator on windows
95
+ # TODO: escape url
96
+ clean_url = URI.escape(File.join(root, path))
97
+ return clean_url
98
+ end
99
+
100
+ # @return [true, false] Returns `true` if no search results for the given page
101
+ def no_search_result?(page)
102
+ return !page.xpath('//div[@class="no-results"]').empty?
103
+ end
104
+
105
+ # @return [URL] The candidate with the highest Jaro-Winkler distance from target
106
+ # @param target [String] the string to compare
107
+ # @param candidates [Array] array of Nokogiri <A> nodes
108
+ def best_match(target, candidates)
109
+ # TODO: replace with a proper array sort
110
+ confidence = 0
111
+ best_url = nil
112
+ jarow = FuzzyStringMatch::JaroWinkler.create( :native )
113
+ candidates.each do |candidate|
114
+ title = candidate.text
115
+ distance = jarow.getDistance(target, title)
116
+ if distance > confidence
117
+ confidence = distance
118
+ best_url = candidate['href']
119
+ end
120
+ end
121
+ return best_url
122
+ end
123
+
124
+ def debug( prefix = "debug", message )
125
+ puts "-"*50
126
+ puts "#{prefix}: #{message}"
127
+ puts "="*50
128
+ end
129
+ end
metadata ADDED
@@ -0,0 +1,44 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: rjl-allmusic
3
+ version: !ruby/object:Gem::Version
4
+ version: '0.2'
5
+ platform: ruby
6
+ authors:
7
+ - Richard Lyon
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2016-02-06 00:00:00.000000000 Z
12
+ dependencies: []
13
+ description:
14
+ email: richard@richardlyon.net
15
+ executables: []
16
+ extensions: []
17
+ extra_rdoc_files: []
18
+ files:
19
+ - lib/allmusic.rb
20
+ homepage: https://github.com/richardjlyon/allmusic
21
+ licenses:
22
+ - MIT
23
+ metadata: {}
24
+ post_install_message:
25
+ rdoc_options: []
26
+ require_paths:
27
+ - lib
28
+ required_ruby_version: !ruby/object:Gem::Requirement
29
+ requirements:
30
+ - - ">="
31
+ - !ruby/object:Gem::Version
32
+ version: '0'
33
+ required_rubygems_version: !ruby/object:Gem::Requirement
34
+ requirements:
35
+ - - ">="
36
+ - !ruby/object:Gem::Version
37
+ version: '0'
38
+ requirements: []
39
+ rubyforge_project:
40
+ rubygems_version: 2.5.1
41
+ signing_key:
42
+ specification_version: 4
43
+ summary: Get genre and style information from Allmusic.com
44
+ test_files: []