bio-ucsc-api 0.0.1
Sign up to get free protection for your applications and to get access to all the features.
- data/.document +5 -0
- data/.rspec +2 -0
- data/COPYING +58 -0
- data/COPYING.ja +51 -0
- data/Gemfile +19 -0
- data/Gemfile.lock +49 -0
- data/README.rdoc +57 -0
- data/Rakefile +72 -0
- data/VERSION +1 -0
- data/bio-ucsc-api.gemspec +212 -0
- data/lib/bio-ucsc.rb +20 -0
- data/lib/bio-ucsc/hg18.rb +27 -0
- data/lib/bio-ucsc/hg18/activerecord.rb +166 -0
- data/lib/bio-ucsc/hg18/cnpiafrate2.rb +31 -0
- data/lib/bio-ucsc/hg18/cnplocke.rb +31 -0
- data/lib/bio-ucsc/hg18/cnpredon.rb +32 -0
- data/lib/bio-ucsc/hg18/cnpsebat2.rb +35 -0
- data/lib/bio-ucsc/hg18/cnpsharp2.rb +32 -0
- data/lib/bio-ucsc/hg18/db_connection.rb +61 -0
- data/lib/bio-ucsc/hg18/dgv.rb +27 -0
- data/lib/bio-ucsc/hg18/refgene.rb +27 -0
- data/lib/bio-ucsc/hg18/rmsk.rb +51 -0
- data/lib/bio-ucsc/hg18/tables.rb +142 -0
- data/lib/bio-ucsc/hg19.rb +54 -0
- data/lib/bio-ucsc/hg19/activerecord.rb +217 -0
- data/lib/bio-ucsc/hg19/ccdsgene.rb +33 -0
- data/lib/bio-ucsc/hg19/cytoband.rb +33 -0
- data/lib/bio-ucsc/hg19/db_connection.rb +61 -0
- data/lib/bio-ucsc/hg19/dgv.rb +27 -0
- data/lib/bio-ucsc/hg19/ensgene.rb +21 -0
- data/lib/bio-ucsc/hg19/gwascatalog.rb +26 -0
- data/lib/bio-ucsc/hg19/hapmapalleleschimp.rb +35 -0
- data/lib/bio-ucsc/hg19/hapmapallelesmacaque.rb +35 -0
- data/lib/bio-ucsc/hg19/hapmapsnpsasw.rb +33 -0
- data/lib/bio-ucsc/hg19/hapmapsnpsceu.rb +33 -0
- data/lib/bio-ucsc/hg19/hapmapsnpschb.rb +33 -0
- data/lib/bio-ucsc/hg19/hapmapsnpschd.rb +33 -0
- data/lib/bio-ucsc/hg19/hapmapsnpsgih.rb +34 -0
- data/lib/bio-ucsc/hg19/hapmapsnpsjpt.rb +34 -0
- data/lib/bio-ucsc/hg19/hapmapsnpslwk.rb +35 -0
- data/lib/bio-ucsc/hg19/hapmapsnpsmex.rb +35 -0
- data/lib/bio-ucsc/hg19/hapmapsnpsmkk.rb +35 -0
- data/lib/bio-ucsc/hg19/hapmapsnpstsi.rb +35 -0
- data/lib/bio-ucsc/hg19/hapmapsnpsyri.rb +35 -0
- data/lib/bio-ucsc/hg19/knowngene.rb +34 -0
- data/lib/bio-ucsc/hg19/omimgene.rb +25 -0
- data/lib/bio-ucsc/hg19/phastconselements46wayprimates.rb +27 -0
- data/lib/bio-ucsc/hg19/phylop46wayprimates.rb +27 -0
- data/lib/bio-ucsc/hg19/refgene.rb +27 -0
- data/lib/bio-ucsc/hg19/rmsk.rb +32 -0
- data/lib/bio-ucsc/hg19/snp131.rb +30 -0
- data/lib/bio-ucsc/hg19/snp132.rb +31 -0
- data/lib/bio-ucsc/hg19/snp132codingdbsnp.rb +29 -0
- data/lib/bio-ucsc/hg19/snp132common.rb +32 -0
- data/lib/bio-ucsc/hg19/snp132flagged.rb +31 -0
- data/lib/bio-ucsc/hg19/snp132mult.rb +32 -0
- data/lib/bio-ucsc/hg19/wgrna.rb +29 -0
- data/lib/bio-ucsc/ucsc_bin.rb +148 -0
- data/samples/hg19-sample.rb +66 -0
- data/spec/hg18/cnpiafrate2_spec.rb +23 -0
- data/spec/hg18/cnplocke_spec.rb +23 -0
- data/spec/hg18/cnpredon_spec.rb +23 -0
- data/spec/hg18/cnpsebat2_spec.rb +23 -0
- data/spec/hg18/cnpsharp2_spec.rb +23 -0
- data/spec/hg18/db_connection_spec.rb +36 -0
- data/spec/hg18/dgv_spec.rb +23 -0
- data/spec/hg18/refgene_spec.rb +23 -0
- data/spec/hg18/rmsk_spec.rb +33 -0
- data/spec/hg19/ccdsgene_spec.rb +23 -0
- data/spec/hg19/cytoband_spec.rb +23 -0
- data/spec/hg19/db_connection_spec.rb +37 -0
- data/spec/hg19/dgv_spec.rb +23 -0
- data/spec/hg19/ensgene_spec.rb +23 -0
- data/spec/hg19/gwascatalog_spec.rb +23 -0
- data/spec/hg19/hapmapalleleschimp_spec.rb +23 -0
- data/spec/hg19/hapmapallelesmacaque_spec.rb +23 -0
- data/spec/hg19/hapmapsnpsasw_spec.rb +23 -0
- data/spec/hg19/hapmapsnpsceu_spec.rb +23 -0
- data/spec/hg19/hapmapsnpschb_spec.rb +23 -0
- data/spec/hg19/hapmapsnpschd_spec.rb +23 -0
- data/spec/hg19/hapmapsnpsgih_spec.rb +23 -0
- data/spec/hg19/hapmapsnpsjpt_spec.rb +23 -0
- data/spec/hg19/hapmapsnpslwk_spec.rb +23 -0
- data/spec/hg19/hapmapsnpsmex_spec.rb +23 -0
- data/spec/hg19/hapmapsnpsmkk_spec.rb +23 -0
- data/spec/hg19/hapmapsnpstsi_spec.rb +23 -0
- data/spec/hg19/hapmapsnpsyri_spec.rb +23 -0
- data/spec/hg19/knowngene_spec.rb +23 -0
- data/spec/hg19/omimGene_spec.rb +23 -0
- data/spec/hg19/phastconselements46wayprimates_spec.rb +23 -0
- data/spec/hg19/phyloP46wayPrimates_spec.rb +23 -0
- data/spec/hg19/refgene_spec.rb +23 -0
- data/spec/hg19/rmsk_spec.rb +23 -0
- data/spec/hg19/snp132Flagged_spec.rb +24 -0
- data/spec/hg19/snp132_spec.rb +23 -0
- data/spec/hg19/snp132codingdbsnp_spec.rb +23 -0
- data/spec/hg19/snp132common_spec.rb +24 -0
- data/spec/hg19/snp132mult_spec.rb +23 -0
- data/spec/hg19/wgrna_spec.rb +23 -0
- data/spec/spec_helper.rb +12 -0
- metadata +368 -0
data/lib/bio-ucsc.rb
ADDED
@@ -0,0 +1,20 @@
|
|
1
|
+
#
|
2
|
+
# = ucsc.rb
|
3
|
+
# Copyright:: Cioyrught (C) 2011
|
4
|
+
# MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
5
|
+
# License:: Ruby licence (Ryby's / GPLv2 dual)
|
6
|
+
|
7
|
+
base = File.dirname(__FILE__)
|
8
|
+
require "#{base}/bio-ucsc/ucsc_bin"
|
9
|
+
require "bio-genomic-interval"
|
10
|
+
|
11
|
+
module Bio
|
12
|
+
module Ucsc
|
13
|
+
base = File.dirname(__FILE__)
|
14
|
+
autoload :Hg18, "#{base}/bio-ucsc/hg18"
|
15
|
+
autoload :Hg19, "#{base}/bio-ucsc/hg19"
|
16
|
+
|
17
|
+
# ToDo
|
18
|
+
# autoload :Mm9, "#{base}/bio-ucsc/mm9"
|
19
|
+
end
|
20
|
+
end
|
@@ -0,0 +1,27 @@
|
|
1
|
+
#
|
2
|
+
# = ucsc.rb
|
3
|
+
# Copyright:: Cioyrught (C) 2011
|
4
|
+
# MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
5
|
+
# Copyright:: Copyright (C) 2008
|
6
|
+
# Jan Aerts <jan.aerts@gmail.com>
|
7
|
+
# License:: Ruby's
|
8
|
+
|
9
|
+
base = File.dirname(__FILE__)
|
10
|
+
require "#{base}/hg18/db_connection"
|
11
|
+
require "#{base}/hg18/activerecord"
|
12
|
+
|
13
|
+
module Bio
|
14
|
+
module Ucsc
|
15
|
+
module Hg18
|
16
|
+
base = File.dirname(__FILE__)
|
17
|
+
autoload :RefGene, "#{base}/hg18/refgene"
|
18
|
+
autoload :Dgv, "#{base}/hg18/dgv"
|
19
|
+
autoload :CnpIafrate2, "#{base}/hg18/cnpiafrate2"
|
20
|
+
autoload :CnpLocke, "#{base}/hg18/cnplocke"
|
21
|
+
autoload :CnpRedon, "#{base}/hg18/cnpredon"
|
22
|
+
autoload :CnpSebat2, "#{base}/hg18/cnpsebat2"
|
23
|
+
autoload :CnpSharp2, "#{base}/hg18/cnpsharp2"
|
24
|
+
autoload :Rmsk, "#{base}/hg18/rmsk.rb"
|
25
|
+
end
|
26
|
+
end
|
27
|
+
end
|
@@ -0,0 +1,166 @@
|
|
1
|
+
#
|
2
|
+
# = ucsc/hg18/activerecord.rb - ActiveRecord mappings to UCSC hg18 database
|
3
|
+
#
|
4
|
+
# Copyright::
|
5
|
+
# Copyright (C) 2011 MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
6
|
+
# Copyright (C) 2008 Jan Aerts <jan.aerts@gmail.com>
|
7
|
+
# License:: The Ruby licence (Ryby's / GPLv2 dual)
|
8
|
+
#
|
9
|
+
# = DESCRIPTION
|
10
|
+
# == What is it?
|
11
|
+
# The UCSC module provides an API to the UCSC databases
|
12
|
+
# stored at genome-mysql.cse.ucsc.edu. This is the same information that is
|
13
|
+
# available from http://genome.ucsc.edu
|
14
|
+
#
|
15
|
+
# The Ucsc::Hg18 module covers the hg19 (= GRCh37) assembly.
|
16
|
+
#
|
17
|
+
# == ActiveRecord
|
18
|
+
# The UCSC API provides a ruby interface to the UCSC mysql databases
|
19
|
+
# at genome-mysql.cse.ucsc.edu. Most of the API is based on ActiveRecord to
|
20
|
+
# get data from that database. In general, each table is described by a
|
21
|
+
# class with the same name: the cnpRedon table is covered by the
|
22
|
+
# CnpRedon class, the dgv table is covered by the Dgv class,
|
23
|
+
# etc. As a result, accessors are available for all columns in each table.
|
24
|
+
# For example, the cnpRedon table has the following columns: chrom, chromStart,
|
25
|
+
# chromEnd and name. Through ActiveRecord, these column names become available
|
26
|
+
# as attributes of CnpRedon objects:
|
27
|
+
# puts my_cnp_redon.name
|
28
|
+
# puts my_cnp_redon.chrom
|
29
|
+
# puts my_cnp_redon.chromStart
|
30
|
+
# puts my_cnp_redon.chromEnd
|
31
|
+
#
|
32
|
+
# ActiveRecord makes it easy to extract data from those tables using the
|
33
|
+
# collection of #find methods. There are three types of #find methods (e.g.
|
34
|
+
# for the CnpRedon class):
|
35
|
+
# a. find based on primary key in table:
|
36
|
+
# # not possible with the UCSC database
|
37
|
+
# b. find_by_sql:
|
38
|
+
# my_cnp = CnpRedon.find_by_sql('SELECT * FROM cnpRedon WHERE name = 'cnp1'")
|
39
|
+
# c. find_by_<insert_your_column_name_here>
|
40
|
+
# my_cnp = CnpRedon.find_by_name('cnp1')
|
41
|
+
# my_cnp2 = CnpRedon.find_by_chrom_and_chromStart('chr1',377)
|
42
|
+
# To find out which find_by_<column> methods are available, you can list the
|
43
|
+
# column names using the column_names class methods:
|
44
|
+
#
|
45
|
+
# puts Ucsc::Hg18::CnpRedon.column_names.join("\t")
|
46
|
+
#
|
47
|
+
# For more information on the find methods, see
|
48
|
+
# http://ar.rubyonrails.org/classes/ActiveRecord/Base.html#M000344
|
49
|
+
#
|
50
|
+
|
51
|
+
module Bio
|
52
|
+
module Ucsc
|
53
|
+
|
54
|
+
# = DESCRIPTION
|
55
|
+
# The Bin::Ucsc::Hg18 module covers the hg18 database from
|
56
|
+
# genome-mysql.cse.ucsc.edu and covers mainly sequences and their annotations.
|
57
|
+
# For a more information about the database tables, click on the "Describe
|
58
|
+
# table schema" in the Table Browser.
|
59
|
+
module Hg18
|
60
|
+
# interval: chromStart, chromEnd
|
61
|
+
# bin index is enabled
|
62
|
+
module QueryUsingChromBin
|
63
|
+
def find_by_interval(interval)
|
64
|
+
zstart = interval.zero_start
|
65
|
+
zend = interval.zero_end
|
66
|
+
where = <<-SQL
|
67
|
+
chrom = :chrom
|
68
|
+
AND bin in (:bins)
|
69
|
+
AND ((chromStart BETWEEN :zstart AND :zend)
|
70
|
+
OR (chromEnd BETWEEN :zstart AND :zend)
|
71
|
+
OR (chromStart <= :zstart AND chromEnd >= :zend))
|
72
|
+
SQL
|
73
|
+
cond = {
|
74
|
+
:chrom => interval.chrom,
|
75
|
+
:bins => Ucsc::UcscBin.bin_all(zstart, zend),
|
76
|
+
:zstart => zstart,
|
77
|
+
:zend => zend,
|
78
|
+
}
|
79
|
+
|
80
|
+
self.find(:all,
|
81
|
+
:select => "*",
|
82
|
+
:conditions => [where, cond],
|
83
|
+
)
|
84
|
+
end
|
85
|
+
end # module QueryUsingChromBin
|
86
|
+
|
87
|
+
# interval: chromStart, chromEnd
|
88
|
+
# bin index is disabled
|
89
|
+
module QueryUsingChrom
|
90
|
+
def find_by_interval(interval)
|
91
|
+
zstart = interval.zero_start
|
92
|
+
zend = interval.zero_end
|
93
|
+
where = <<-SQL
|
94
|
+
chrom = :chrom
|
95
|
+
AND ((chromStart BETWEEN :zstart AND :zend)
|
96
|
+
OR (chromEnd BETWEEN :zstart AND :zend)
|
97
|
+
OR (chromStart <= :zstart AND chromEnd >= :zend))
|
98
|
+
SQL
|
99
|
+
cond = {
|
100
|
+
:chrom => interval.chrom,
|
101
|
+
:zstart => zstart,
|
102
|
+
:zend => zend,
|
103
|
+
}
|
104
|
+
self.find(:all,
|
105
|
+
:select => "*",
|
106
|
+
:conditions => [where, cond],
|
107
|
+
)
|
108
|
+
end
|
109
|
+
end # module QueryUsingChrom
|
110
|
+
|
111
|
+
# interval: chromStart, chromEnd
|
112
|
+
# bin index is disabled
|
113
|
+
module QueryUsingTxBin
|
114
|
+
def find_by_interval(interval)
|
115
|
+
zstart = interval.zero_start
|
116
|
+
zend = interval.zero_end
|
117
|
+
where = <<-SQL
|
118
|
+
chrom = :chrom
|
119
|
+
AND bin in (:bins)
|
120
|
+
AND ((txStart BETWEEN :zstart AND :zend)
|
121
|
+
OR (txEnd BETWEEN :zstart AND :zend)
|
122
|
+
OR (txStart <= :zstart AND txEnd >= :zend))
|
123
|
+
SQL
|
124
|
+
cond = {
|
125
|
+
:chrom => interval.chrom,
|
126
|
+
:bins => Bio::Ucsc::UcscBin.bin_all(zstart, zend),
|
127
|
+
:zstart => zstart,
|
128
|
+
:zend => zend,
|
129
|
+
}
|
130
|
+
self.find(:all,
|
131
|
+
:select => "*",
|
132
|
+
:conditions => [where, cond],
|
133
|
+
)
|
134
|
+
end
|
135
|
+
end # module QueryUsingTxBin
|
136
|
+
|
137
|
+
# interval: genoName, genoStart, genoEnd
|
138
|
+
# bin index is enabled
|
139
|
+
module QueryUsingGenoBin
|
140
|
+
def find_by_interval(interval)
|
141
|
+
zstart = interval.zero_start
|
142
|
+
zend = interval.zero_end
|
143
|
+
where = <<-SQL
|
144
|
+
genoName = :chrom
|
145
|
+
AND bin in (:bins)
|
146
|
+
AND ((genoStart BETWEEN :zstart AND :zend)
|
147
|
+
OR (genoEnd BETWEEN :zstart AND :zend)
|
148
|
+
OR (genoStart <= :zstart AND genoEnd >= :zend))
|
149
|
+
SQL
|
150
|
+
cond = {
|
151
|
+
:chrom => interval.chrom,
|
152
|
+
:bins => Ucsc::UcscBin.bin_all(zstart, zend),
|
153
|
+
:zstart => zstart,
|
154
|
+
:zend => zend,
|
155
|
+
}
|
156
|
+
|
157
|
+
self.find(:all,
|
158
|
+
:select => "*",
|
159
|
+
:conditions => [where, cond],
|
160
|
+
)
|
161
|
+
end
|
162
|
+
end # module QueryUsingChromBin
|
163
|
+
|
164
|
+
end # module Hg18
|
165
|
+
end # module Ucsc
|
166
|
+
end # module Bio
|
@@ -0,0 +1,31 @@
|
|
1
|
+
#
|
2
|
+
# = hg18/cnpiafrate2.rb
|
3
|
+
# Copyright::
|
4
|
+
# Copyright (C) 2011 MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
5
|
+
# Copyright (C) 2008 Jan Aerts <jan.aerts@gmail.com>
|
6
|
+
# License:: The Ruby licence (Ryby's / GPLv2 dual)
|
7
|
+
#
|
8
|
+
# = Table desfription in UCSC Table Browser
|
9
|
+
# This annotation shows regions detected as putative copy number
|
10
|
+
# polymorphisms (CNP) and sites of detected intermediate-sized
|
11
|
+
# structural variation (ISV). The CNPs and ISVs were determined by
|
12
|
+
# various methods, displayed in individual subtracks within the
|
13
|
+
# annotation.
|
14
|
+
#
|
15
|
+
# Iafrate BAC microarray analysis
|
16
|
+
# All hybridizations were performed in duplicate incorporating a
|
17
|
+
# dye-reversal using proprieta#ry 1 Mb GenomeChip V1.2 Human BAC Arrays
|
18
|
+
# consisting of 2,632 BAC clones (Spectral Genomics,# Houston, TX). The
|
19
|
+
# false positive rate was estimated at ~1 clone per 5,264 tested.
|
20
|
+
|
21
|
+
module Bio
|
22
|
+
module Ucsc
|
23
|
+
module Hg18
|
24
|
+
class CnpIafrate2 < DBConnection
|
25
|
+
extend Bio::Ucsc::Hg18::QueryUsingChromBin
|
26
|
+
set_table_name 'cnpIafrate2'
|
27
|
+
set_primary_key nil
|
28
|
+
end
|
29
|
+
end
|
30
|
+
end
|
31
|
+
end
|
@@ -0,0 +1,31 @@
|
|
1
|
+
#
|
2
|
+
# = hg18/cnplocke.rb
|
3
|
+
# Copyright::
|
4
|
+
# Copyright (C) 2011 MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
5
|
+
# Copyright (C) 2008 Jan Aerts <jan.aerts@gmail.com>
|
6
|
+
# License:: The Ruby licence (Ryby's / GPLv2 dual)
|
7
|
+
#
|
8
|
+
# = Table desfription in UCSC Table Browser
|
9
|
+
# This annotation shows regions detected as putative copy number
|
10
|
+
# polymorphisms (CNP) and sites of detected intermediate-sized
|
11
|
+
# structural variation (ISV). The CNPs and ISVs were determined by
|
12
|
+
# various methods, displayed in individual subtracks within the
|
13
|
+
# annotation.
|
14
|
+
#
|
15
|
+
# Locke analysis of duplication-rich regions
|
16
|
+
# DNA samples were obtained from Coriell Cell Repositories. The
|
17
|
+
# reference DNA used for all hybridizations was from a single male of
|
18
|
+
# Czechoslovakian descent, Coriell ID GM15724 (also used in the Sharp
|
19
|
+
# study).
|
20
|
+
|
21
|
+
module Bio
|
22
|
+
module Ucsc
|
23
|
+
module Hg18
|
24
|
+
class CnpLocke < DBConnection
|
25
|
+
extend Bio::Ucsc::Hg18::QueryUsingChromBin
|
26
|
+
set_table_name 'cnpLocke'
|
27
|
+
set_primary_key nil
|
28
|
+
end
|
29
|
+
end
|
30
|
+
end
|
31
|
+
end
|
@@ -0,0 +1,32 @@
|
|
1
|
+
#
|
2
|
+
# = hg18/cnpredon.rb
|
3
|
+
# Copyright::
|
4
|
+
# Copyright (C) 2011 MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
5
|
+
# Copyright (C) 2008 Jan Aerts <jan.aerts@gmail.com>
|
6
|
+
# License:: The Ruby licence (Ryby's / GPLv2 dual)
|
7
|
+
#
|
8
|
+
# = Table desfription in UCSC Table Browser
|
9
|
+
# This annotation shows regions detected as putative copy number
|
10
|
+
# polymorphisms (CNP) and sites of detected intermediate-sized
|
11
|
+
# structural variation (ISV). The CNPs and ISVs were determined by
|
12
|
+
# various methods, displayed in individual subtracks within the
|
13
|
+
# annotation.
|
14
|
+
#
|
15
|
+
# Redon analysis of HapMap data
|
16
|
+
# Experiments were performed with the International HapMap DNA and
|
17
|
+
# cell-line collection using two technologies: comparative analysis of
|
18
|
+
# hybridization intensities on Affymetric GeneChip Human Mapping 500K
|
19
|
+
# early access arrays (500K EA) and comparative genomic hybridization
|
20
|
+
# with a Whole Genome TilePath (WGTP) array.
|
21
|
+
|
22
|
+
module Bio
|
23
|
+
module Ucsc
|
24
|
+
module Hg18
|
25
|
+
class CnpRedon < DBConnection
|
26
|
+
extend Bio::Ucsc::Hg18::QueryUsingChromBin
|
27
|
+
set_table_name 'cnpRedon'
|
28
|
+
set_primary_key nil
|
29
|
+
end
|
30
|
+
end
|
31
|
+
end
|
32
|
+
end
|
@@ -0,0 +1,35 @@
|
|
1
|
+
#
|
2
|
+
# = hg18/cnpsebat2.rb
|
3
|
+
# Copyright::
|
4
|
+
# Copyright (C) 2011 MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
5
|
+
# Copyright (C) 2008 Jan Aerts <jan.aerts@gmail.com>
|
6
|
+
# License:: The Ruby licence (Ryby's / GPLv2 dual)
|
7
|
+
#
|
8
|
+
# = Table desfription in UCSC Table Browser
|
9
|
+
# This annotation shows regions detected as putative copy number
|
10
|
+
# polymorphisms (CNP) and sites of detected intermediate-sized
|
11
|
+
# structural variation (ISV). The CNPs and ISVs were determined by
|
12
|
+
# various methods, displayed in individual subtracks within the
|
13
|
+
# annotation.
|
14
|
+
#
|
15
|
+
# Sebat ROMA Following digestion with BglII or HindIII, genomic DNA
|
16
|
+
# was hybridized to a custom array consisting of 85,000
|
17
|
+
# oligonucleotide probes. The probes were selected to be free of
|
18
|
+
# common repeats and have unique homology within the human genome. The
|
19
|
+
# average resolution of the array was -5 kb; however, only intervals
|
20
|
+
# in which three consecutive probes showed concordant signals were
|
21
|
+
# scored as CNPs. All hybridizations were performed in duplicate
|
22
|
+
# incorporating a dye-reversal, with the false positive rate estimated
|
23
|
+
# to be -6%.
|
24
|
+
|
25
|
+
module Bio
|
26
|
+
module Ucsc
|
27
|
+
module Hg18
|
28
|
+
class CnpSebat2 < DBConnection
|
29
|
+
extend Bio::Ucsc::Hg18::QueryUsingChrom
|
30
|
+
set_table_name 'cnpSebat2'
|
31
|
+
set_primary_key nil
|
32
|
+
end
|
33
|
+
end
|
34
|
+
end
|
35
|
+
end
|
@@ -0,0 +1,32 @@
|
|
1
|
+
#
|
2
|
+
# = hg18/cnpsharp2.rb
|
3
|
+
# Copyright::
|
4
|
+
# Copyright (C) 2011 MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
5
|
+
# Copyright (C) 2008 Jan Aerts <jan.aerts@gmail.com>
|
6
|
+
# License:: The Ruby licence (Ryby's / GPLv2 dual)
|
7
|
+
#
|
8
|
+
# = Table desfription in UCSC Table Browser
|
9
|
+
# This annotation shows regions detected as putative copy number
|
10
|
+
# polymorphisms (CNP) and sites of detected intermediate-sized
|
11
|
+
# structural variation (ISV). The CNPs and ISVs were determined by
|
12
|
+
# various methods, displayed in individual subtracks within the
|
13
|
+
# annotation.
|
14
|
+
#
|
15
|
+
# Sharp BAC microarray analysis
|
16
|
+
# All hybridizations were performed in duplicate incorporating a
|
17
|
+
# dye-reversal using a custom array consisting of 2,194 end-sequence
|
18
|
+
# or FISH-confirmed BACs, targeted to regions of the genome flanked by
|
19
|
+
# segmental duplications. The false positive rate was estimated at -3
|
20
|
+
# clones per 4,000 tested.
|
21
|
+
|
22
|
+
module Bio
|
23
|
+
module Ucsc
|
24
|
+
module Hg18
|
25
|
+
class CnpSharp2 < DBConnection
|
26
|
+
extend Bio::Ucsc::Hg18::QueryUsingChromBin
|
27
|
+
set_table_name 'cnpSharp2'
|
28
|
+
set_primary_key nil
|
29
|
+
end
|
30
|
+
end
|
31
|
+
end
|
32
|
+
end
|
@@ -0,0 +1,61 @@
|
|
1
|
+
#
|
2
|
+
# = lib/ucsc/hg18/db_connection.rb - UCSC hg18 DB connection
|
3
|
+
#
|
4
|
+
# Copyright:: Cioyrught (C) 2011
|
5
|
+
# MISHIMA, Hiroyuki <missy at be.to / hmishima at nagasaki-u.ac.jp>
|
6
|
+
# Copyright:: Copyright (C) 2008
|
7
|
+
# Jan Aerts <jan.aerts@gmail.com>
|
8
|
+
# License:: Ruby licence (Ryby's / GPLv2 dual)
|
9
|
+
|
10
|
+
require 'rubygems'
|
11
|
+
require 'active_record'
|
12
|
+
|
13
|
+
module Bio
|
14
|
+
module Ucsc
|
15
|
+
|
16
|
+
module Hg18
|
17
|
+
# = DESCRIPTION
|
18
|
+
# The Ucsc::Hg18::DBConnection is the actual connection established
|
19
|
+
# with the UCSC mysql server.
|
20
|
+
|
21
|
+
class DBConnection < ActiveRecord::Base
|
22
|
+
# = DESCRIPTION
|
23
|
+
# The Ucsc::Hg18::DBConnection#connect method makes the connection
|
24
|
+
# to the UCSC hg18 database.
|
25
|
+
#
|
26
|
+
# = USAGE
|
27
|
+
# # Connect to the hg18
|
28
|
+
# Ensembl::Core::DBConnection.connect
|
29
|
+
#
|
30
|
+
# ---
|
31
|
+
# *Arguments*: none
|
32
|
+
@@db_adapter = 'mysql'
|
33
|
+
@@db_host = 'genome-mysql.cse.ucsc.edu'
|
34
|
+
@@db_username = 'genome'
|
35
|
+
@@db_password = ''
|
36
|
+
|
37
|
+
cattr_accessor :db_host, :db_username, :db_password
|
38
|
+
|
39
|
+
self.abstract_class = true
|
40
|
+
|
41
|
+
def self.default
|
42
|
+
@@db_adapter = 'mysql'
|
43
|
+
@@db_host = 'genome-mysql.cse.ucsc.edu'
|
44
|
+
@@db_username = 'genome'
|
45
|
+
@@db_password = ''
|
46
|
+
end
|
47
|
+
|
48
|
+
def self.connect
|
49
|
+
establish_connection(
|
50
|
+
:adapter => @@db_adapter,
|
51
|
+
:host => @@db_host,
|
52
|
+
:database => 'hg18',
|
53
|
+
:username => @@db_username,
|
54
|
+
:password => @@db_password
|
55
|
+
)
|
56
|
+
end
|
57
|
+
end
|
58
|
+
end # module Hg18
|
59
|
+
|
60
|
+
end # module Ucsc
|
61
|
+
end # module Bio
|