diarize-jruby 0.2.0-java → 0.2.1-java
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/README.md +14 -5
- data/diarize-jruby.gemspec +2 -2
- data/lib/diarize/speaker.rb +1 -5
- metadata +2 -2
data/README.md
CHANGED
@@ -10,6 +10,7 @@ archive prototype.
|
|
10
10
|
See http://worldservice.prototyping.bbc.co.uk/programmes/X0403940 for
|
11
11
|
an example.
|
12
12
|
|
13
|
+
|
13
14
|
Speaker diarization
|
14
15
|
-------------------
|
15
16
|
|
@@ -38,10 +39,11 @@ It also includes support for speaker supervectors [Campbell2006], which
|
|
38
39
|
can be used in combination with our ruby-lsh library for fast speaker
|
39
40
|
identification.
|
40
41
|
|
42
|
+
|
41
43
|
Example use
|
42
44
|
-----------
|
43
45
|
|
44
|
-
This gem has been tested with jruby 1.7.
|
46
|
+
This gem has been tested with jruby 1.7.2 onwards.
|
45
47
|
|
46
48
|
$ jruby -S gem install diarize-jruby
|
47
49
|
$ jruby -S irb
|
@@ -53,15 +55,21 @@ This gem has been tested with jruby 1.7.2 onwards.
|
|
53
55
|
> audio.to_rdf
|
54
56
|
> speakers = audio.speakers
|
55
57
|
> speakers.first.gender
|
56
|
-
> speakers.first.model.
|
58
|
+
> speakers.first.model.mean_log_likelihood
|
57
59
|
> speakers.first.model.components.size
|
58
|
-
> audio.
|
59
|
-
> audio.
|
60
|
+
> audio.segments_by_speaker(speakers.first)[0].play
|
61
|
+
> audio.segments_by_speaker(speakers.first)[1].play
|
60
62
|
> ...
|
61
|
-
> speakers |=
|
63
|
+
> speakers |= other_speakers
|
62
64
|
> Diarize::Speaker.match(speakers)
|
63
65
|
|
64
66
|
|
67
|
+
Running tests
|
68
|
+
-------------
|
69
|
+
|
70
|
+
$ jruby -S rake
|
71
|
+
|
72
|
+
|
65
73
|
References
|
66
74
|
----------
|
67
75
|
|
@@ -85,6 +93,7 @@ Proceedings of INTERSPEECH, 2005
|
|
85
93
|
"Support vector machines using GMM supervectors for speaker verification",
|
86
94
|
IEEE Signal Processing Letters, 2006, 13, 308-311
|
87
95
|
|
96
|
+
|
88
97
|
Licensing terms and authorship
|
89
98
|
------------------------------
|
90
99
|
|
data/diarize-jruby.gemspec
CHANGED
@@ -1,10 +1,10 @@
|
|
1
1
|
Gem::Specification.new do |s|
|
2
2
|
s.name = "diarize-jruby"
|
3
|
-
s.version = "0.2.0"
|
3
|
+
s.version = "0.2.1"
|
4
4
|
s.date = "2013-06-14"
|
5
5
|
s.summary = "Speaker Diarization for JRuby"
|
6
6
|
s.email = "yves.raimond@bbc.co.uk"
|
7
|
-
s.homepage = "
|
7
|
+
s.homepage = "https://github.com/bbcrd/diarize-jruby"
|
8
8
|
s.description = "A library for JRuby wrapping the LIUM Speaker Diarization and including a few extra tools"
|
9
9
|
s.has_rdoc = false
|
10
10
|
s.authors = ['Yves Raimond']
|
data/lib/diarize/speaker.rb
CHANGED
@@ -24,12 +24,8 @@ module Diarize
|
|
24
24
|
|
25
25
|
include JBLAS
|
26
26
|
|
27
|
-
# Some possible matching heuristics if using GDMAP:
|
28
|
-
# - speaker mean_log_likelihood needs to be more than -33 to be considered for match
|
29
|
-
# - distance between two speakers need to be less than distance between speaker and universal model + detection threshold to be considered
|
30
|
-
|
31
27
|
@@log_likelihood_threshold = -33
|
32
|
-
@@detection_threshold = 0.2
|
28
|
+
@@detection_threshold = 0.2
|
33
29
|
|
34
30
|
@@speakers = {}
|
35
31
|
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: diarize-jruby
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.2.0
|
4
|
+
version: 0.2.1
|
5
5
|
prerelease:
|
6
6
|
platform: java
|
7
7
|
authors:
|
@@ -65,7 +65,7 @@ files:
|
|
65
65
|
- lib/diarize/ubm.gmm
|
66
66
|
- lib/diarize/speaker.rb
|
67
67
|
- lib/diarize/super_vector.rb
|
68
|
-
homepage:
|
68
|
+
homepage: https://github.com/bbcrd/diarize-jruby
|
69
69
|
licenses: []
|
70
70
|
post_install_message:
|
71
71
|
rdoc_options: []
|