bioroebe 0.12.24 → 0.13.31

Sign up to get free protection for your applications and to get access to all the features.
Files changed (503) hide show
  1. checksums.yaml +4 -4
  2. data/LICENSE.md +7 -8
  3. data/README.md +566 -354
  4. data/bin/all_positions_of_this_nucleotide +1 -1
  5. data/bin/aminoacid_frequencies +1 -1
  6. data/bin/automatically_rename_this_fasta_file +1 -1
  7. data/bin/base_composition +1 -1
  8. data/bin/batch_create_windows_executables +1 -1
  9. data/bin/bioroebe +12 -1
  10. data/bin/bioroebe_cat +7 -0
  11. data/bin/calculate_exponential_growth +7 -0
  12. data/bin/calculate_n50_value +1 -1
  13. data/bin/calculate_the_frequencies_of_this_species +7 -0
  14. data/bin/chunked_display +1 -1
  15. data/bin/codon_frequency +1 -1
  16. data/bin/codon_to_aminoacid +1 -1
  17. data/bin/colourize_this_fasta_sequence +1 -1
  18. data/bin/complementary_dna_strand +1 -1
  19. data/bin/complementary_rna_strand +1 -1
  20. data/bin/consensus_sequence +1 -1
  21. data/bin/dna_to_rna +1 -1
  22. data/bin/downcase_chunked_display +1 -1
  23. data/bin/download_this_pdb +1 -1
  24. data/bin/fasta_index +1 -1
  25. data/bin/fetch_data_from_uniprot +1 -1
  26. data/bin/filter_away_invalid_nucleotides +1 -1
  27. data/bin/find_substring +1 -1
  28. data/bin/input_as_dna +1 -1
  29. data/bin/is_palindrome +1 -1
  30. data/bin/leading_five_prime +1 -1
  31. data/bin/longest_ORF +1 -1
  32. data/bin/longest_substring +1 -1
  33. data/bin/open_reading_frames +1 -1
  34. data/bin/partner_nucleotide +1 -1
  35. data/bin/plain_palindrome +1 -1
  36. data/bin/random_dna_sequence +1 -1
  37. data/bin/random_sequence +1 -1
  38. data/bin/raw_hamming_distance +1 -1
  39. data/bin/return_longest_substring_via_LCS_algorithm +1 -1
  40. data/bin/reverse_sequence +1 -1
  41. data/bin/short_aminoacid_letter_from_long_aminoacid_name +1 -1
  42. data/bin/show_atomic_composition +1 -1
  43. data/bin/show_fasta_header +1 -1
  44. data/bin/show_nucleotide_sequence +1 -1
  45. data/bin/show_this_dna_sequence +1 -1
  46. data/bin/show_time_now +7 -0
  47. data/bin/sort_aminoacid_based_on_its_hydrophobicity +1 -1
  48. data/bin/strict_filter_away_invalid_aminoacids +1 -1
  49. data/{lib/bioroebe/base/reset.rb → bin/three_delimiter} +9 -6
  50. data/bin/three_to_one +1 -1
  51. data/bin/to_rna +1 -1
  52. data/bin/trailing_three_prime +1 -1
  53. data/bin/upcase_this_aminoacid_sequence_and_remove_numbers +1 -1
  54. data/bioroebe.gemspec +6 -7
  55. data/doc/README.gen +534 -322
  56. data/doc/blosum/blosum.md +4 -0
  57. data/doc/compatibility/BIO_PHP.md +20 -18
  58. data/doc/compatibility/README.md +2 -3
  59. data/doc/compatibility/emboss.md +5 -3
  60. data/doc/{extensive_usage_example.md → extensive_usage_example/extensive_usage_example.md} +4 -2
  61. data/doc/{instructions_for_the_taxonomy_subproject.md → instructions_for_the_taxonomy_subproject/instructions_for_the_taxonomy_subproject.md} +36 -33
  62. data/doc/{legacy_paths.md → legacy_paths/legacy_paths.md} +3 -3
  63. data/doc/statistics/statistics.md +12 -10
  64. data/doc/todo/bioroebe_GUI_todo.md +6 -1
  65. data/doc/todo/bioroebe_java_todo.md +3 -2
  66. data/doc/todo/bioroebe_todo.md +328 -310
  67. data/doc/{using_biomart.md → using_biomart/using_biomart.md} +7 -3
  68. data/lib/bioroebe/abstract/features.rb +0 -0
  69. data/lib/bioroebe/aminoacids/aminoacid_substitution.rb +1 -1
  70. data/lib/bioroebe/aminoacids/aminoacids_mass_table.rb +3 -1
  71. data/lib/bioroebe/aminoacids/codon_percentage.rb +18 -10
  72. data/lib/bioroebe/aminoacids/create_random_aminoacids.rb +5 -2
  73. data/lib/bioroebe/aminoacids/deduce_aminoacid_sequence.rb +90 -64
  74. data/lib/bioroebe/aminoacids/display_aminoacid_table.rb +1 -3
  75. data/lib/bioroebe/aminoacids/show_hydrophobicity.rb +2 -2
  76. data/lib/bioroebe/annotations/create_annotation_format.rb +2 -2
  77. data/lib/bioroebe/base/base.rb +101 -6
  78. data/lib/bioroebe/base/base_module/base_module.rb +9 -1
  79. data/lib/bioroebe/base/colours.rb +3 -0
  80. data/lib/bioroebe/base/colours_for_base/colours_for_base.rb +80 -44
  81. data/lib/bioroebe/base/commandline_application/README.md +1 -1
  82. data/lib/bioroebe/base/commandline_application/commandline_application.rb +661 -22
  83. data/lib/bioroebe/base/commandline_application/commandline_arguments.rb +2 -1
  84. data/lib/bioroebe/base/infer_the_namespace_module/infer_the_namespace_module.rb +37 -0
  85. data/lib/bioroebe/base/internal_hash_module/internal_hash_module.rb +1 -6
  86. data/lib/bioroebe/base/prototype/prototype.rb +155 -14
  87. data/lib/bioroebe/biomart/attribute.rb +1 -1
  88. data/lib/bioroebe/biomart/biomart.rb +8 -9
  89. data/lib/bioroebe/biomart/server.rb +1 -1
  90. data/lib/bioroebe/blosum/blosum.rb +2 -2
  91. data/lib/bioroebe/calculate/calculate_blosum_score.rb +5 -3
  92. data/lib/bioroebe/calculate/calculate_gc_content.rb +1 -1
  93. data/lib/bioroebe/calculate/calculate_levensthein_distance.rb +5 -3
  94. data/lib/bioroebe/calculate/calculate_melting_temperature.rb +2 -10
  95. data/lib/bioroebe/calculate/calculate_melting_temperature_for_more_than_thirteen_nucleotides.rb +6 -15
  96. data/lib/bioroebe/calculate/calculate_the_position_specific_scoring_matrix.rb +4 -2
  97. data/lib/bioroebe/cell/cell.rb +3 -2
  98. data/lib/bioroebe/cell/specialized_cells/B_cell.rb +60 -0
  99. data/lib/bioroebe/cell/specialized_cells/Macrophage.rb +60 -0
  100. data/lib/bioroebe/cell/specialized_cells/README.md +5 -0
  101. data/lib/bioroebe/cell/specialized_cells/T_cell.rb +60 -0
  102. data/lib/bioroebe/cleave_and_digest/cleave.rb +3 -1
  103. data/lib/bioroebe/cleave_and_digest/digestion.rb +1 -1
  104. data/lib/bioroebe/codon_tables/frequencies/10090_Mus_musculus.yml +93 -0
  105. data/lib/bioroebe/codon_tables/frequencies/107243_Thlaspi_caerulescens.yml +72 -0
  106. data/lib/bioroebe/codon_tables/frequencies/parse_frequency_table.rb +2 -2
  107. data/lib/bioroebe/codons/codon_table.rb +10 -2
  108. data/lib/bioroebe/codons/codons.rb +3 -3
  109. data/lib/bioroebe/codons/convert_this_codon_to_that_aminoacid.rb +18 -15
  110. data/lib/bioroebe/codons/determine_optimal_codons.rb +1 -1
  111. data/lib/bioroebe/codons/possible_codons_for_this_aminoacid.rb +4 -2
  112. data/lib/bioroebe/codons/show_codon_tables.rb +1 -1
  113. data/lib/bioroebe/codons/show_codon_usage.rb +1 -2
  114. data/lib/bioroebe/codons/show_this_codon_table.rb +2 -2
  115. data/lib/bioroebe/codons/start_codons.rb +7 -3
  116. data/lib/bioroebe/colours/colour_schemes/README.md +1 -1
  117. data/lib/bioroebe/colours/colour_schemes/array_available_colour_schemes.rb +3 -3
  118. data/lib/bioroebe/colours/colour_schemes/colour_scheme.rb +3 -3
  119. data/lib/bioroebe/colours/colour_schemes/colour_scheme_demo.rb +4 -3
  120. data/lib/bioroebe/colours/colour_schemes/helix.rb +3 -1
  121. data/lib/bioroebe/colours/colour_schemes/hydropathy.rb +3 -1
  122. data/lib/bioroebe/colours/colour_schemes/score.rb +13 -2
  123. data/lib/bioroebe/colours/colour_schemes/strand.rb +3 -1
  124. data/lib/bioroebe/colours/colour_schemes/turn.rb +3 -1
  125. data/lib/bioroebe/colours/colour_schemes/zappo.rb +1 -1
  126. data/lib/bioroebe/{toplevel_methods/colourize_related_methods.rb → colours/colourize_related_code.rb} +1 -3
  127. data/lib/bioroebe/colours/colourize_sequence.rb +3 -1
  128. data/lib/bioroebe/colours/colours.rb +172 -15
  129. data/lib/bioroebe/configuration/configuration.rb +1 -1
  130. data/lib/bioroebe/constants/GUIs.rb +2 -2
  131. data/lib/bioroebe/constants/constants.rb +1349 -0
  132. data/lib/bioroebe/conversions/convert_aminoacid_to_dna.rb +8 -13
  133. data/lib/bioroebe/conversions/dna_to_aminoacid_sequence.rb +9 -3
  134. data/lib/bioroebe/count/count_amount_of_aminoacids.rb +11 -10
  135. data/lib/bioroebe/count/count_amount_of_nucleotides.rb +1 -1
  136. data/lib/bioroebe/count/count_at.rb +2 -1
  137. data/lib/bioroebe/databases/download_taxonomy_database.rb +1 -1
  138. data/lib/bioroebe/dotplots/advanced_dotplot.rb +2 -2
  139. data/lib/bioroebe/electron_microscopy/coordinate_analyzer.rb +2 -2
  140. data/lib/bioroebe/electron_microscopy/fix_pos_file.rb +2 -2
  141. data/lib/bioroebe/electron_microscopy/flipy.rb +2 -2
  142. data/lib/bioroebe/electron_microscopy/generate_em2em_file.rb +3 -11
  143. data/lib/bioroebe/electron_microscopy/parse_coordinates.rb +6 -6
  144. data/lib/bioroebe/electron_microscopy/read_file_xmd.rb +6 -6
  145. data/lib/bioroebe/electron_microscopy/simple_star_file_generator.rb +2 -2
  146. data/lib/bioroebe/enzymes/has_this_restriction_enzyme.rb +1 -1
  147. data/lib/bioroebe/enzymes/restriction_enzyme.rb +1 -1
  148. data/lib/bioroebe/enzymes/restriction_enzymes/statistics.rb +4 -3
  149. data/lib/bioroebe/enzymes/restriction_enzymes_file.rb +1 -1
  150. data/lib/bioroebe/enzymes/return_sequence_that_is_cut_via_restriction_enzyme.rb +4 -3
  151. data/lib/bioroebe/enzymes/show_restriction_enzymes.rb +3 -3
  152. data/lib/bioroebe/ext/main.cpp +0 -1
  153. data/lib/bioroebe/fasta_and_fastq/autocorrect_the_name_of_this_fasta_file.rb +3 -3
  154. data/lib/bioroebe/fasta_and_fastq/compact_fasta_file/compact_fasta_file.rb +1 -1
  155. data/lib/bioroebe/fasta_and_fastq/display_how_many_fasta_entries_are_in_this_directory.rb +1 -1
  156. data/lib/bioroebe/fasta_and_fastq/download_fasta.rb +8 -14
  157. data/lib/bioroebe/fasta_and_fastq/fasta_defline/fasta_defline.rb +1 -1
  158. data/lib/bioroebe/fasta_and_fastq/fasta_to_yaml/fasta_to_yaml.rb +1 -1
  159. data/lib/bioroebe/fasta_and_fastq/fastq_format_explainer.rb +1 -1
  160. data/lib/bioroebe/fasta_and_fastq/length_modifier/length_modifier.rb +1 -1
  161. data/lib/bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb +37 -11
  162. data/lib/bioroebe/fasta_and_fastq/parse_fastq/parse_fastq.rb +2 -2
  163. data/lib/bioroebe/fasta_and_fastq/return_fasta_subsection_of_this_file.rb +1 -1
  164. data/lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb +5 -13
  165. data/lib/bioroebe/fasta_and_fastq/show_fasta_statistics.rb +1 -1
  166. data/lib/bioroebe/fasta_and_fastq/simplify_fasta_header/simplify_fasta_header.rb +1 -1
  167. data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/reset.rb +3 -6
  168. data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/split_this_fasta_file_into_chromosomes.rb +3 -3
  169. data/lib/bioroebe/genbank/genbank_flat_file_format_generator.rb +20 -11
  170. data/lib/bioroebe/genome/genome.rb +1 -1
  171. data/lib/bioroebe/genomes/genome_pattern.rb +17 -16
  172. data/lib/bioroebe/genomes/genome_retriever.rb +4 -2
  173. data/lib/bioroebe/gui/experimental/snapgene/snapgene.rb +10 -13
  174. data/lib/bioroebe/gui/universal_widgets/alignment/alignment.rb +557 -0
  175. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/aminoacid_composition/aminoacid_composition.rb +498 -198
  176. data/lib/bioroebe/gui/universal_widgets/anti_sense_strand/anti_sense_strand.rb +665 -0
  177. data/lib/bioroebe/gui/universal_widgets/blosum_matrix_viewer/blosum_matrix_viewer.rb +329 -0
  178. data/lib/bioroebe/gui/universal_widgets/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +423 -0
  179. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/controller/controller.rb +170 -118
  180. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +277 -215
  181. data/lib/bioroebe/gui/{shared_code/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget_module.rb → universal_widgets/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb} +297 -107
  182. data/lib/bioroebe/gui/universal_widgets/fasta_table_widget/fasta_table_widget.rb +643 -0
  183. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/format_converter/format_converter.rb +236 -164
  184. data/lib/bioroebe/gui/universal_widgets/gene/gene.rb +278 -0
  185. data/lib/bioroebe/gui/universal_widgets/hamming_distance/hamming_distance.rb +646 -0
  186. data/lib/bioroebe/gui/{shared_code/levensthein_distance/levensthein_distance_module.rb → universal_widgets/levensthein_distance/levensthein_distance.rb} +313 -88
  187. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/nucleotide_analyser/nucleotide_analyser.rb +281 -189
  188. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/parse_pdb_file/parse_pdb_file.rb +265 -149
  189. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/primer_design_widget/primer_design_widget.rb +337 -263
  190. data/lib/bioroebe/gui/universal_widgets/protein_to_DNA/protein_to_DNA.rb +408 -0
  191. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/random_sequence/random_sequence.rb +245 -187
  192. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/restriction_enzymes/restriction_enzymes.rb +207 -137
  193. data/lib/bioroebe/gui/universal_widgets/shell/shell.rb +288 -0
  194. data/lib/bioroebe/gui/{gtk3/show_codon_table/misc.rb → universal_widgets/show_codon_table/show_codon_table.rb} +290 -110
  195. data/lib/bioroebe/gui/{shared_code/show_codon_usage/show_codon_usage_module.rb → universal_widgets/show_codon_usage/show_codon_usage.rb} +228 -47
  196. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/sizeseq/sizeseq.rb +151 -69
  197. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/three_to_one/three_to_one.rb +190 -127
  198. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/www_finder/www_finder.rb +211 -152
  199. data/lib/bioroebe/images/images.html +953 -1170
  200. data/lib/bioroebe/images/misc/README.md +6 -0
  201. data/lib/bioroebe/images/misc/activation.avif +0 -0
  202. data/lib/bioroebe/images/misc/inhibition.avif +0 -0
  203. data/lib/bioroebe/images/misc/small_virus_logo.avif +0 -0
  204. data/lib/bioroebe/{constants/base_directory.rb → log_directory/log_directory.rb} +79 -59
  205. data/lib/bioroebe/matplotlib/matplotlib_generator.rb +1 -1
  206. data/lib/bioroebe/misc/quiz/three_letter_to_aminoacid.rb +1 -1
  207. data/lib/bioroebe/misc/ruler.rb +5 -5
  208. data/lib/bioroebe/misc/useful_formulas.rb +3 -3
  209. data/lib/bioroebe/ncbi/efetch.rb +1 -2
  210. data/lib/bioroebe/ngs/phred_quality_score_table.rb +3 -3
  211. data/lib/bioroebe/nucleotides/complementary_dna_strand.rb +3 -6
  212. data/lib/bioroebe/nucleotides/molecular_weight_of_nucleotides.rb +3 -3
  213. data/lib/bioroebe/nucleotides/most_likely_nucleotide_sequence_for_this_aminoacid_sequence.rb +6 -10
  214. data/lib/bioroebe/nucleotides/{show_nucleotide_sequence.rb → show_nucleotide_sequence/show_nucleotide_sequence.rb} +377 -255
  215. data/lib/bioroebe/palindromes/palindrome_2D_structure.rb +1 -1
  216. data/lib/bioroebe/palindromes/palindrome_finder.rb +1 -1
  217. data/lib/bioroebe/palindromes/palindrome_generator.rb +2 -10
  218. data/lib/bioroebe/parsers/biolang_parser.rb +1 -1
  219. data/lib/bioroebe/parsers/blosum_parser.rb +14 -19
  220. data/lib/bioroebe/parsers/genbank_parser.rb +2 -6
  221. data/lib/bioroebe/parsers/gff.rb +9 -9
  222. data/lib/bioroebe/parsers/parse_embl.rb +2 -6
  223. data/lib/bioroebe/parsers/stride_parser.rb +4 -12
  224. data/lib/bioroebe/patterns/analyse_glycosylation_pattern.rb +2 -2
  225. data/lib/bioroebe/patterns/is_this_sequence_a_EGF2_pattern.rb +6 -3
  226. data/lib/bioroebe/patterns/profile_pattern.rb +2 -2
  227. data/lib/bioroebe/patterns/rgg_scanner.rb +4 -2
  228. data/lib/bioroebe/{protein_structure → pdb_and_protein_structure}/alpha_helix.rb +2 -2
  229. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/download_this_pdb.rb +2 -3
  230. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/fetch_fasta_sequence_from_pdb.rb +4 -4
  231. data/lib/bioroebe/{protein_structure → pdb_and_protein_structure}/helical_wheel.rb +2 -2
  232. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/parse_mmCIF_file.rb +1 -1
  233. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/parse_pdb_file.rb +3 -3
  234. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/report_secondary_structures_from_this_pdb_file.rb +3 -3
  235. data/lib/bioroebe/project/project.rb +3 -1
  236. data/lib/bioroebe/raw_sequence/README.md +8 -8
  237. data/lib/bioroebe/raw_sequence/raw_sequence.rb +11 -2
  238. data/lib/bioroebe/regexes/regexes.rb +1 -2
  239. data/lib/bioroebe/requires/commandline_application.rb +3 -1
  240. data/lib/bioroebe/requires/require_all_pdb_files.rb +1 -1
  241. data/lib/bioroebe/requires/require_all_taxonomy_files.rb +1 -1
  242. data/lib/bioroebe/requires/require_all_utility_scripts_files.rb +10 -0
  243. data/lib/bioroebe/requires/require_colours.rb +1 -1
  244. data/lib/bioroebe/requires/require_the_bioroebe_project.rb +5 -7
  245. data/lib/bioroebe/requires/require_the_bioroebe_sinatra_components.rb +1 -1
  246. data/lib/bioroebe/requires/require_the_constants.rb +2 -14
  247. data/lib/bioroebe/requires/require_yaml.rb +7 -5
  248. data/lib/bioroebe/sequence/alignment.rb +1 -1
  249. data/lib/bioroebe/sequence/dna.rb +4 -2
  250. data/lib/bioroebe/sequence/nucleotide_module/nucleotide_module.rb +22 -8
  251. data/lib/bioroebe/sequence/protein.rb +2 -2
  252. data/lib/bioroebe/sequence/reverse_complement.rb +3 -3
  253. data/lib/bioroebe/sequence/rna.rb +9 -8
  254. data/lib/bioroebe/sequence/sequence.rb +3 -3
  255. data/lib/bioroebe/shell/configuration/additionally_set_xorg_buffer.yml +0 -0
  256. data/lib/bioroebe/shell/configuration/may_we_show_the_startup_information.yml +0 -0
  257. data/lib/bioroebe/shell/configuration/upcase_nucleotides.yml +0 -0
  258. data/lib/bioroebe/shell/configuration/use_silent_startup.yml +1 -1
  259. data/lib/bioroebe/shell/help/class.rb +68 -19
  260. data/lib/bioroebe/shell/menu.rb +5244 -5322
  261. data/lib/bioroebe/shell/{readline/readline.rb → readline.rb} +1 -3
  262. data/lib/bioroebe/shell/shell.rb +11240 -453
  263. data/lib/bioroebe/siRNA/siRNA.rb +3 -3
  264. data/lib/bioroebe/{gui/shared_code/blosum_matrix_viewer/blosum_matrix_viewer_module.rb → sinatra/sinatra_interface.rb} +28 -19
  265. data/lib/bioroebe/{www/sinatra/sinatra.rb → sinatra/sinatra_wrapper.rb} +731 -754
  266. data/lib/bioroebe/string_matching/find_longest_substring.rb +2 -10
  267. data/lib/bioroebe/string_matching/find_longest_substring_via_LCS_algorithm.rb +4 -14
  268. data/lib/bioroebe/string_matching/hamming_distance.rb +11 -10
  269. data/lib/bioroebe/string_matching/levensthein.rb +5 -17
  270. data/lib/bioroebe/string_matching/simple_string_comparer.rb +48 -4
  271. data/lib/bioroebe/string_matching/smith_waterman.rb +11 -6
  272. data/lib/bioroebe/svg/glyph.rb +4 -1
  273. data/lib/bioroebe/svg/mini_feature.rb +1 -1
  274. data/lib/bioroebe/svg/page.rb +18 -7
  275. data/lib/bioroebe/svg/svgee.rb +22 -13
  276. data/lib/bioroebe/svg/track.rb +20 -4
  277. data/lib/bioroebe/taxonomy/chart.rb +2 -2
  278. data/lib/bioroebe/taxonomy/class_methods.rb +5 -6
  279. data/lib/bioroebe/taxonomy/constants.rb +1 -1
  280. data/lib/bioroebe/taxonomy/info/info.rb +1 -1
  281. data/lib/bioroebe/taxonomy/info/is_dna.rb +1 -1
  282. data/lib/bioroebe/taxonomy/interactive.rb +1 -2
  283. data/lib/bioroebe/taxonomy/menu.rb +1 -1
  284. data/lib/bioroebe/taxonomy/node.rb +1 -1
  285. data/lib/bioroebe/taxonomy/parse_fasta.rb +4 -2
  286. data/lib/bioroebe/taxonomy/shared.rb +5 -4
  287. data/lib/bioroebe/taxonomy/taxonomy.rb +2 -4
  288. data/lib/bioroebe/toplevel_methods/fasta_and_fastq.rb +3 -45
  289. data/lib/bioroebe/toplevel_methods/{is_on_roebe.rb → roebe.rb} +1 -11
  290. data/lib/bioroebe/toplevel_methods/taxonomy.rb +6 -12
  291. data/lib/bioroebe/toplevel_methods/toplevel_methods.rb +5568 -0
  292. data/lib/bioroebe/utility_scripts/align_open_reading_frames.rb +4 -3
  293. data/lib/bioroebe/utility_scripts/analyse_local_dataset.rb +2 -2
  294. data/lib/bioroebe/utility_scripts/check_for_mismatches/check_for_mismatches.rb +16 -9
  295. data/lib/bioroebe/utility_scripts/compacter/compacter.rb +4 -2
  296. data/lib/bioroebe/utility_scripts/compare_these_two_sequences_via_blosum.rb +119 -0
  297. data/lib/bioroebe/utility_scripts/compseq/compseq.rb +11 -9
  298. data/lib/bioroebe/utility_scripts/{consensus_sequence.rb → consensus_sequence/consensus_sequence.rb} +13 -4
  299. data/lib/bioroebe/utility_scripts/{create_batch_entrez_file.rb → create_batch_entrez_file/create_batch_entrez_file.rb} +5 -5
  300. data/lib/bioroebe/utility_scripts/{determine_antigenic_areas.rb → determine_antigenic_areas/determine_antigenic_areas.rb} +5 -5
  301. data/lib/bioroebe/utility_scripts/{determine_missing_nucleotides_percentage.rb → determine_missing_nucleotides_percentage/determine_missing_nucleotides_percentage.rb} +16 -15
  302. data/lib/bioroebe/utility_scripts/display_open_reading_frames/display_open_reading_frames.rb +7 -7
  303. data/lib/bioroebe/utility_scripts/display_open_reading_frames/misc.rb +1 -1
  304. data/lib/bioroebe/utility_scripts/display_open_reading_frames/report.rb +2 -0
  305. data/lib/bioroebe/utility_scripts/{dot_alignment.rb → dot_alignment/dot_alignment.rb} +3 -3
  306. data/lib/bioroebe/utility_scripts/{download_files_from_rebase.rb → download_files_from_rebase/download_files_from_rebase.rb} +5 -5
  307. data/lib/bioroebe/utility_scripts/fetch_data_from_uniprot/fetch_data_from_uniprot.rb +269 -0
  308. data/lib/bioroebe/utility_scripts/find_gene.rb +4 -2
  309. data/lib/bioroebe/utility_scripts/{mirror_repeat.rb → mirror_repeat/mirror_repeat.rb} +5 -5
  310. data/lib/bioroebe/utility_scripts/move_file_to_its_correct_location.rb +3 -3
  311. data/lib/bioroebe/utility_scripts/{parse_taxonomy.rb → parse_taxonomy/parse_taxonomy.rb} +15 -6
  312. data/lib/bioroebe/utility_scripts/{pathways.rb → pathways/pathways.rb} +4 -3
  313. data/lib/bioroebe/utility_scripts/{permutations.rb → permutations/permutations.rb} +3 -3
  314. data/lib/bioroebe/utility_scripts/punnet/punnet.rb +4 -2
  315. data/lib/bioroebe/utility_scripts/{show_this_dna_sequence.rb → show_this_dna_sequence/show_this_dna_sequence.rb} +1 -1
  316. data/lib/bioroebe/utility_scripts/showorf/showorf.rb +406 -10
  317. data/lib/bioroebe/version/version.rb +2 -2
  318. data/lib/bioroebe/viennarna/rnafold_wrapper.rb +5 -13
  319. data/lib/bioroebe/virus/individual_viruses/README.md +15 -0
  320. data/lib/bioroebe/virus/individual_viruses/tobacco_mosaic_virus.rb +40 -0
  321. data/lib/bioroebe/virus/virus.rb +76 -0
  322. data/lib/bioroebe/www/bioroebe.cgi +4 -3
  323. data/lib/bioroebe/www/embeddable_interface.rb +85 -49
  324. data/lib/bioroebe/yaml/agarose/agarose_concentrations.yml +6 -6
  325. data/lib/bioroebe/yaml/antisense/antisense.yml +2 -0
  326. data/lib/bioroebe/yaml/blosum/blosum50.yml +6 -0
  327. data/lib/bioroebe/yaml/blosum/blosum90.yml +2 -1
  328. data/lib/bioroebe/yaml/chromosomes/chromosome_numbers.yml +2 -2
  329. data/lib/bioroebe/yaml/configuration/temp_dir.yml +1 -1
  330. data/lib/bioroebe/yaml/consensus_sequences/consensus_sequences.yml +1 -0
  331. data/lib/bioroebe/yaml/enzymes/enzyme_classes.yml +7 -6
  332. data/lib/bioroebe/yaml/humans/human_chromosomes.yml +3 -3
  333. data/lib/bioroebe/yaml/mRNA/mRNA.yml +1 -5
  334. data/lib/bioroebe/yaml/nucleotides/abbreviations_for_nucleotides.yml +1 -0
  335. data/lib/bioroebe/yaml/nucleotides/nucleotide_density.yml +2 -1
  336. data/lib/bioroebe/yaml/promoters/35S.yml +3 -1
  337. data/lib/bioroebe/yaml/proteases/proteases.yml +3 -1
  338. data/lib/bioroebe/yaml/proteins/ubiquitin.yml +4 -1
  339. data/lib/bioroebe/yaml/restriction_enzymes/restriction_enzymes.yml +7 -7
  340. data/spec/testing_toplevel_method_editor.rb +1 -1
  341. data/spec/testing_toplevel_method_verbose.rb +1 -1
  342. data/test/testing_dna_to_rna_conversion.rb +1 -1
  343. metadata +127 -235
  344. data/doc/blosum.md +0 -5
  345. data/lib/bioroebe/base/commandline_application/aminoacids.rb +0 -33
  346. data/lib/bioroebe/base/commandline_application/directory.rb +0 -33
  347. data/lib/bioroebe/base/commandline_application/extract.rb +0 -22
  348. data/lib/bioroebe/base/commandline_application/misc.rb +0 -502
  349. data/lib/bioroebe/base/commandline_application/opn.rb +0 -47
  350. data/lib/bioroebe/base/commandline_application/reset.rb +0 -42
  351. data/lib/bioroebe/base/commandline_application/warnings.rb +0 -36
  352. data/lib/bioroebe/base/commandline_application/write_what_into.rb +0 -29
  353. data/lib/bioroebe/base/initialize.rb +0 -18
  354. data/lib/bioroebe/base/misc.rb +0 -129
  355. data/lib/bioroebe/base/namespace.rb +0 -16
  356. data/lib/bioroebe/base/prototype/e_and_ee.rb +0 -24
  357. data/lib/bioroebe/base/prototype/misc.rb +0 -114
  358. data/lib/bioroebe/base/prototype/mkdir.rb +0 -20
  359. data/lib/bioroebe/base/prototype/reset.rb +0 -36
  360. data/lib/bioroebe/colours/misc_colours.rb +0 -80
  361. data/lib/bioroebe/colours/rev.rb +0 -44
  362. data/lib/bioroebe/colours/sdir.rb +0 -21
  363. data/lib/bioroebe/colours/sfancy.rb +0 -21
  364. data/lib/bioroebe/colours/sfile.rb +0 -21
  365. data/lib/bioroebe/colours/simp.rb +0 -21
  366. data/lib/bioroebe/colours/swarn.rb +0 -29
  367. data/lib/bioroebe/constants/aminoacids_and_proteins.rb +0 -147
  368. data/lib/bioroebe/constants/carriage_return.rb +0 -14
  369. data/lib/bioroebe/constants/codon_tables.rb +0 -77
  370. data/lib/bioroebe/constants/database_constants.rb +0 -107
  371. data/lib/bioroebe/constants/files_and_directories.rb +0 -606
  372. data/lib/bioroebe/constants/misc.rb +0 -209
  373. data/lib/bioroebe/constants/newline.rb +0 -14
  374. data/lib/bioroebe/constants/nucleotides.rb +0 -121
  375. data/lib/bioroebe/constants/regex.rb +0 -28
  376. data/lib/bioroebe/constants/roebe.rb +0 -38
  377. data/lib/bioroebe/constants/row_terminator.rb +0 -16
  378. data/lib/bioroebe/constants/tabulator.rb +0 -14
  379. data/lib/bioroebe/constants/unicode.rb +0 -12
  380. data/lib/bioroebe/constants/urls.rb +0 -50
  381. data/lib/bioroebe/gui/gtk +0 -1
  382. data/lib/bioroebe/gui/gtk3/README.md +0 -2
  383. data/lib/bioroebe/gui/gtk3/alignment/alignment.rb +0 -306
  384. data/lib/bioroebe/gui/gtk3/anti_sense_strand/anti_sense_strand.rb +0 -29
  385. data/lib/bioroebe/gui/gtk3/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -195
  386. data/lib/bioroebe/gui/gtk3/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +0 -105
  387. data/lib/bioroebe/gui/gtk3/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +0 -188
  388. data/lib/bioroebe/gui/gtk3/fasta_table_widget/fasta_table_widget.rb +0 -322
  389. data/lib/bioroebe/gui/gtk3/gene/gene.rb +0 -181
  390. data/lib/bioroebe/gui/gtk3/hamming_distance/hamming_distance.rb +0 -383
  391. data/lib/bioroebe/gui/gtk3/levensthein_distance/levensthein_distance.rb +0 -174
  392. data/lib/bioroebe/gui/gtk3/protein_to_DNA/protein_to_DNA.rb +0 -181
  393. data/lib/bioroebe/gui/gtk3/show_codon_table/show_codon_table.rb +0 -101
  394. data/lib/bioroebe/gui/gtk3/show_codon_usage/show_codon_usage.rb +0 -145
  395. data/lib/bioroebe/gui/gtk3/three_to_one/title.rb +0 -23
  396. data/lib/bioroebe/gui/jruby/alignment/alignment.rb +0 -165
  397. data/lib/bioroebe/gui/jruby/aminoacid_composition/aminoacid_composition.rb +0 -166
  398. data/lib/bioroebe/gui/jruby/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -82
  399. data/lib/bioroebe/gui/libui/README.md +0 -4
  400. data/lib/bioroebe/gui/libui/alignment/alignment.rb +0 -116
  401. data/lib/bioroebe/gui/libui/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -112
  402. data/lib/bioroebe/gui/libui/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +0 -60
  403. data/lib/bioroebe/gui/libui/controller/controller.rb +0 -116
  404. data/lib/bioroebe/gui/libui/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +0 -161
  405. data/lib/bioroebe/gui/libui/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +0 -76
  406. data/lib/bioroebe/gui/libui/hamming_distance/hamming_distance.rb +0 -135
  407. data/lib/bioroebe/gui/libui/levensthein_distance/levensthein_distance.rb +0 -118
  408. data/lib/bioroebe/gui/libui/protein_to_DNA/protein_to_DNA.rb +0 -115
  409. data/lib/bioroebe/gui/libui/random_sequence/random_sequence.rb +0 -190
  410. data/lib/bioroebe/gui/libui/show_codon_table/show_codon_table.rb +0 -134
  411. data/lib/bioroebe/gui/libui/show_codon_usage/show_codon_usage.rb +0 -89
  412. data/lib/bioroebe/gui/libui/three_to_one/three_to_one.rb +0 -113
  413. data/lib/bioroebe/gui/shared_code/alignment/alignment_module.rb +0 -102
  414. data/lib/bioroebe/gui/shared_code/aminoacid_composition/aminoacid_composition_module.rb +0 -94
  415. data/lib/bioroebe/gui/shared_code/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria_module.rb +0 -216
  416. data/lib/bioroebe/gui/shared_code/protein_to_DNA/protein_to_DNA_module.rb +0 -192
  417. data/lib/bioroebe/gui/shared_code/show_codon_table/show_codon_table_module.rb +0 -72
  418. data/lib/bioroebe/gui/tk/aminoacid_composition/aminoacid_composition.rb +0 -206
  419. data/lib/bioroebe/gui/tk/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -140
  420. data/lib/bioroebe/gui/tk/hamming_distance/hamming_distance.rb +0 -262
  421. data/lib/bioroebe/gui/tk/levensthein_distance/levensthein_distance.rb +0 -243
  422. data/lib/bioroebe/gui/tk/three_to_one/three_to_one.rb +0 -199
  423. data/lib/bioroebe/gui/unified_widgets/anti_sense_strand/anti_sense_strand.rb +0 -519
  424. data/lib/bioroebe/shell/colours/colours.rb +0 -235
  425. data/lib/bioroebe/shell/help/help.rb +0 -25
  426. data/lib/bioroebe/shell/misc.rb +0 -10227
  427. data/lib/bioroebe/toplevel_methods/ad_hoc_task.rb +0 -56
  428. data/lib/bioroebe/toplevel_methods/aminoacids_and_proteins.rb +0 -722
  429. data/lib/bioroebe/toplevel_methods/atomic_composition.rb +0 -198
  430. data/lib/bioroebe/toplevel_methods/base_composition.rb +0 -121
  431. data/lib/bioroebe/toplevel_methods/blast.rb +0 -153
  432. data/lib/bioroebe/toplevel_methods/calculate_n50_value.rb +0 -57
  433. data/lib/bioroebe/toplevel_methods/cat.rb +0 -71
  434. data/lib/bioroebe/toplevel_methods/chunked_display.rb +0 -92
  435. data/lib/bioroebe/toplevel_methods/cliner.rb +0 -81
  436. data/lib/bioroebe/toplevel_methods/complement.rb +0 -58
  437. data/lib/bioroebe/toplevel_methods/convert_global_env.rb +0 -39
  438. data/lib/bioroebe/toplevel_methods/databases.rb +0 -73
  439. data/lib/bioroebe/toplevel_methods/delimiter.rb +0 -19
  440. data/lib/bioroebe/toplevel_methods/digest.rb +0 -81
  441. data/lib/bioroebe/toplevel_methods/download_and_fetch_data.rb +0 -146
  442. data/lib/bioroebe/toplevel_methods/e.rb +0 -20
  443. data/lib/bioroebe/toplevel_methods/editor.rb +0 -21
  444. data/lib/bioroebe/toplevel_methods/esystem.rb +0 -22
  445. data/lib/bioroebe/toplevel_methods/exponential_growth.rb +0 -74
  446. data/lib/bioroebe/toplevel_methods/extract.rb +0 -56
  447. data/lib/bioroebe/toplevel_methods/file_and_directory_related_actions.rb +0 -269
  448. data/lib/bioroebe/toplevel_methods/frequencies.rb +0 -99
  449. data/lib/bioroebe/toplevel_methods/hamming_distance.rb +0 -60
  450. data/lib/bioroebe/toplevel_methods/infer.rb +0 -66
  451. data/lib/bioroebe/toplevel_methods/leading_five_prime_and_trailing_three_prime.rb +0 -101
  452. data/lib/bioroebe/toplevel_methods/levensthein.rb +0 -63
  453. data/lib/bioroebe/toplevel_methods/log_directory.rb +0 -109
  454. data/lib/bioroebe/toplevel_methods/longest_common_substring.rb +0 -55
  455. data/lib/bioroebe/toplevel_methods/map_ncbi_entry_to_eutils_id.rb +0 -88
  456. data/lib/bioroebe/toplevel_methods/matches.rb +0 -259
  457. data/lib/bioroebe/toplevel_methods/misc.rb +0 -596
  458. data/lib/bioroebe/toplevel_methods/nucleotides.rb +0 -787
  459. data/lib/bioroebe/toplevel_methods/number_of_clones.rb +0 -63
  460. data/lib/bioroebe/toplevel_methods/open_in_browser.rb +0 -79
  461. data/lib/bioroebe/toplevel_methods/open_reading_frames.rb +0 -236
  462. data/lib/bioroebe/toplevel_methods/opn.rb +0 -34
  463. data/lib/bioroebe/toplevel_methods/palindromes.rb +0 -155
  464. data/lib/bioroebe/toplevel_methods/parse.rb +0 -59
  465. data/lib/bioroebe/toplevel_methods/phred_error_probability.rb +0 -68
  466. data/lib/bioroebe/toplevel_methods/rds.rb +0 -24
  467. data/lib/bioroebe/toplevel_methods/remove.rb +0 -86
  468. data/lib/bioroebe/toplevel_methods/return_source_code_of_this_method.rb +0 -35
  469. data/lib/bioroebe/toplevel_methods/return_subsequence_based_on_indices.rb +0 -68
  470. data/lib/bioroebe/toplevel_methods/rna_splicing.rb +0 -73
  471. data/lib/bioroebe/toplevel_methods/rnalfold.rb +0 -69
  472. data/lib/bioroebe/toplevel_methods/searching_and_finding.rb +0 -116
  473. data/lib/bioroebe/toplevel_methods/shuffleseq.rb +0 -37
  474. data/lib/bioroebe/toplevel_methods/statistics.rb +0 -53
  475. data/lib/bioroebe/toplevel_methods/sum_of_odd_integers.rb +0 -62
  476. data/lib/bioroebe/toplevel_methods/three_delimiter.rb +0 -34
  477. data/lib/bioroebe/toplevel_methods/time_and_date.rb +0 -53
  478. data/lib/bioroebe/toplevel_methods/to_camelcase.rb +0 -31
  479. data/lib/bioroebe/toplevel_methods/truncate.rb +0 -48
  480. data/lib/bioroebe/toplevel_methods/url.rb +0 -36
  481. data/lib/bioroebe/toplevel_methods/verbose.rb +0 -59
  482. data/lib/bioroebe/utility_scripts/showorf/constants.rb +0 -31
  483. data/lib/bioroebe/utility_scripts/showorf/help.rb +0 -33
  484. data/lib/bioroebe/utility_scripts/showorf/initialize.rb +0 -52
  485. data/lib/bioroebe/utility_scripts/showorf/menu.rb +0 -68
  486. data/lib/bioroebe/utility_scripts/showorf/reset.rb +0 -36
  487. data/lib/bioroebe/utility_scripts/showorf/run.rb +0 -152
  488. data/lib/bioroebe/utility_scripts/showorf/show.rb +0 -97
  489. /data/doc/{german_names_for_the_aminoacids.md → german_names_for_the_aminoacids/german_names_for_the_aminoacids.md} +0 -0
  490. /data/doc/{pdb_ATOM_entry.md → pdb_ATOM_entry/pdb_ATOM_entry.md} +0 -0
  491. /data/doc/{resources.md → resources/resources.md} +0 -0
  492. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/aminoacid_composition/customized_dialog.rb +0 -0
  493. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/anti_sense_strand/anti_sense_strand.config +0 -0
  494. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.config +0 -0
  495. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.config +0 -0
  496. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/hamming_distance/hamming_distance.config +0 -0
  497. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/levensthein_distance/levensthein_distance.config +0 -0
  498. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/protein_to_DNA/protein_to_DNA.config +0 -0
  499. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/restriction_enzymes/restriction_enzymes.config +0 -0
  500. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/www_finder/www_finder.config +0 -0
  501. /data/lib/bioroebe/yaml/{base_composition_of_dna.yml → base_composition_of_dna/base_composition_of_dna.yml} +0 -0
  502. /data/lib/bioroebe/yaml/{nuclear_localization_sequences.yml → nuclear_localization_sequences/nuclear_localization_sequences.yml} +0 -0
  503. /data/lib/bioroebe/yaml/{talens.yml → talens/talens.yml} +0 -0
@@ -1,198 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/atomic_composition.rb'
6
- # Bioroebe.show_atomic_composition
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- require 'bioroebe/constants/files_and_directories.rb'
11
- require 'bioroebe/colours/rev.rb'
12
- require 'bioroebe/toplevel_methods/aminoacids_and_proteins.rb'
13
- require 'bioroebe/toplevel_methods/e.rb'
14
- require 'bioroebe/toplevel_methods/is_on_roebe.rb'
15
-
16
- # ========================================================================= #
17
- # === Bioroebe.atomic_composition
18
- #
19
- # This method will return the composition of atoms in a given protein,
20
- # via Hash, such as:
21
- #
22
- # {"C"=>11, "H"=>19, "N"=>5, "O"=>6, "S"=>0}
23
- #
24
- # The Hash keeps track of 11 C atoms, 19 H atoms, 5 N atoms,
25
- # 6 O atoms and 0 S atoms.
26
- #
27
- # This hash can then be formatted via the method:
28
- #
29
- # Bioroebe.show_atomic_composition()
30
- #
31
- # Which can be found below.
32
- #
33
- # Presently this method works on aminoacids only, but in theory the
34
- # code could be extended to work with DNA nucleotides and RNA
35
- # nucleotides as well.
36
- #
37
- # Either way, the one letter abbreviation should be used as input
38
- # to this method.
39
- #
40
- # When we use aminoacids, we need to remember that a peptide bond
41
- # deducts 1x H₂O (water). This will have to be deducted from the
42
- # formula, but only if it is an internal aminoacid. In other words,
43
- # the only two aminoacids that will behave differently, are the
44
- # first one (since it will miss one -OH group) and the last
45
- # aminoacid (as this one will lack a -H molecule.
46
- #
47
- # Remember that the input sequence to this method should be the
48
- # one-letter code for the aminoacid sequence at hand.
49
- # ========================================================================= #
50
- def self.atomic_composition(
51
- of = 'GGGGA' # ← This should be the aminoacid sequence.
52
- )
53
- begin
54
- require 'chemistry_paradise/split_molecule_names.rb'
55
- require 'chemistry_paradise/toplevel_methods/remove_this_molecule_from.rb'
56
- rescue LoadError
57
- if is_on_roebe?
58
- puts 'Two files from the chemistry_paradise gem are not available.'
59
- end
60
- end
61
- # ======================================================================= #
62
- # Load up the molecular formula for each aminoacid next. This will
63
- # be used as our reference-point for calculating things such as the
64
- # composition, or weight.
65
- # ======================================================================= #
66
- dataset_molecular_formula_for_the_aminoacids = YAML.load_file(
67
- FILE_AMINOACIDS_MOLECULAR_FORMULA
68
- )
69
- if of.is_a?(Array)
70
- if of.empty?
71
- of = 'GGGGA' # In this case reinstate the default.
72
- else
73
- if of.first.is_a?(String) and of.first.size > 1
74
- of = of.first.split(//) # Split it on a per-character basis here.
75
- end
76
- end
77
- end
78
- if of.is_a? String
79
- of = of.split(//)
80
- end
81
- unless of.is_a? Array
82
- of = [of]
83
- end
84
- hash_keeping_track_of_the_atomic_composition = {}
85
- # ======================================================================= #
86
- # Build up the default values, for the atoms C, H, N, O and S.
87
- # ======================================================================= #
88
- hash_keeping_track_of_the_atomic_composition['C'] = 0
89
- hash_keeping_track_of_the_atomic_composition['H'] = 0
90
- hash_keeping_track_of_the_atomic_composition['N'] = 0
91
- hash_keeping_track_of_the_atomic_composition['O'] = 0
92
- hash_keeping_track_of_the_atomic_composition['S'] = 0
93
- # ======================================================================= #
94
- # Next obtain the formula from the ChemistryParadise project. We
95
- # do so by iterating over the given input, and we assume that
96
- # this input is always an Array.
97
- # ======================================================================= #
98
- of.map.with_index {|this_amino_acid, position_of_that_aminoacid|
99
- # ===================================================================== #
100
- # Next, we have to obtain the formula for this amino acid.
101
- # ===================================================================== #
102
- this_amino_acid = AMINO_ACIDS_ENGLISH[this_amino_acid]
103
- formula_for_this_amino_acid = dataset_molecular_formula_for_the_aminoacids[this_amino_acid]
104
- # ===================================================================== #
105
- # The next case-menu will handle the position of the aminoacid at hand.
106
- # We will skip doing so if there is only one aminoacid though.
107
- # ===================================================================== #
108
- if of.first.to_s.size > 1
109
- case position_of_that_aminoacid # case tag
110
- when 0 # This is the first aminoacid. It loses only one 'OH' group.
111
- formula_for_this_amino_acid =
112
- ::ChemistryParadise.remove_this_molecule_from('OH', formula_for_this_amino_acid)
113
- when (of.size - 1) # This is the last entry. It loses only one 'H' group.
114
- formula_for_this_amino_acid =
115
- ::ChemistryParadise.remove_this_molecule_from('H', formula_for_this_amino_acid)
116
- else
117
- # ================================================================= #
118
- # Else it will lose a full H₂O group.
119
- # ================================================================= #
120
- formula_for_this_amino_acid =
121
- ::ChemistryParadise.remove_this_molecule_from('H2O', formula_for_this_amino_acid)
122
- end
123
- end
124
- array_chemical_formula = ::ChemistryParadise.split_this_molecular_formula_into_a_hash(
125
- formula_for_this_amino_acid
126
- )
127
- array_chemical_formula.each {|molecule_and_number| # e. g. 'H13'
128
- if molecule_and_number =~ /\d+/ # If it has at the least one number.
129
- molecule_and_number =~ /([A-Z]+)(\d{1,2})/ # See: https://rubular.com/r/nCojEDcY6g
130
- molecule = $1.to_s.dup
131
- n_times = $2.to_s.dup.to_i
132
- hash_keeping_track_of_the_atomic_composition[molecule] += n_times
133
- else # else it must be 1, since there is no other number, such as 'N'.
134
- hash_keeping_track_of_the_atomic_composition[molecule_and_number] += 1
135
- end
136
- }
137
- }
138
- return hash_keeping_track_of_the_atomic_composition
139
- end
140
-
141
- # ========================================================================= #
142
- # === Bioroebe.show_atomic_composition
143
- #
144
- # This method will output the above.
145
- #
146
- # Display style is similar to ExPASY output.
147
- #
148
- # Atomic composition:
149
- #
150
- # Carbon C 11
151
- # Hydrogen H 19
152
- # Nitrogen N 5
153
- # Oxygen O 6
154
- # Sulfur S 0
155
- #
156
- # ========================================================================= #
157
- def self.show_atomic_composition(
158
- of = 'GGGGA'
159
- )
160
- if of.is_a? Array
161
- of = of.join(' ').strip
162
- end
163
- padding_to_use = ' '
164
- hash = ::Bioroebe.atomic_composition(of)
165
- _ = ''.dup
166
- _ << "#{rev}Atomic composition of #{steelblue(of)}#{rev}:\n\n"
167
- n_atoms_in_total = hash.values.sum
168
- array = %w( C H N O S )
169
- array.each {|this_atom|
170
- case this_atom
171
- when 'C'
172
- _ << "#{padding_to_use}#{rev}Carbon C #{hash[this_atom].to_s.rjust(4)}\n"
173
- when 'H'
174
- _ << "#{padding_to_use}#{rev}Hydrogen H #{hash[this_atom].to_s.rjust(4)}\n"
175
- when 'N'
176
- _ << "#{padding_to_use}#{rev}Nitrogen N #{hash[this_atom].to_s.rjust(4)}\n"
177
- when 'O'
178
- _ << "#{padding_to_use}#{rev}Oxygen O #{hash[this_atom].to_s.rjust(4)}\n"
179
- when 'S'
180
- _ << "#{padding_to_use}#{rev}Sulfur S #{hash[this_atom].to_s.rjust(4)}\n"
181
- end
182
- }
183
- _ << " "+("-" * 18)
184
- _ << "\n"
185
- _ << " Total: #{n_atoms_in_total}\n\n"
186
- puts _
187
- end
188
-
189
- end
190
-
191
- if __FILE__ == $PROGRAM_NAME
192
- if ARGV.empty?
193
- pp Bioroebe.atomic_composition(ARGV)
194
- Bioroebe.show_atomic_composition
195
- else
196
- Bioroebe.show_atomic_composition(ARGV)
197
- end
198
- end # atomiccomposition GGGGA
@@ -1,121 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/base_composition.rb'
6
- # Bioroebe.report_base_composition
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- require 'bioroebe/colours/colours.rb'
11
- require 'bioroebe/colours/rev.rb'
12
- require 'bioroebe/toplevel_methods/e.rb'
13
-
14
- # ========================================================================= #
15
- # === Bioroebe.base_composition
16
- #
17
- # This method can be used to query the composition of a given DNA
18
- # sequence, that is, in percentage, the values for A, T, C and
19
- # G.
20
- #
21
- # This method will then return a Hash, consisting of the percentage
22
- # values of A, T, C and G in the given DNA sequence at hand.
23
- #
24
- # Note that the input to this method has to include a '%' character,
25
- # at the least up until March 2020. Past March 2020 this requirement
26
- # was dropped, but I still think it is visually more elegant to
27
- # include a '%' character.
28
- # ========================================================================= #
29
- def self.base_composition(
30
- i = '52%GC'
31
- )
32
- if i.is_a? Array
33
- if i.empty?
34
- i = '52%GC' # Default value.
35
- else
36
- i = i.join(' ').strip
37
- end
38
- end
39
- # ======================================================================= #
40
- # Add support for Files here.
41
- # ======================================================================= #
42
- if i and File.exist?(i)
43
- i = File.readlines(i).reject {|line| line.start_with? '>' }.join("\n").delete("\n")
44
- end
45
- # ======================================================================= #
46
- # We must use a Hash for this.
47
- # ======================================================================= #
48
- hash = {
49
- 'A' => 0,
50
- 'T' => 0,
51
- 'C' => 0,
52
- 'G' => 0,
53
- }
54
- if i.include? '%'
55
- splitted = i.split('%').map(&:strip)
56
- frequency = splitted.first.to_i
57
- opposite_frequency = 100 - frequency
58
- characters = splitted.last.split(//)
59
- characters.each {|this_nucleotide|
60
- hash[this_nucleotide] = frequency / 2
61
- }
62
- # ===================================================================== #
63
- # Next calculate the missing nucleotides:
64
- # ===================================================================== #
65
- missing_nucleotides = hash.select {|key, value|
66
- value == 0
67
- }
68
- missing_nucleotides.each_pair {|this_nucleotide, value|
69
- hash[this_nucleotide] = opposite_frequency / 2
70
- }
71
- else
72
- frequency = Hash.new(0)
73
- chars = i.chars
74
- chars.each { |entry| frequency[entry] += 1 }
75
- sum = frequency.values.sum
76
- frequency.each_pair {|this_nucleotide, value|
77
- hash[this_nucleotide] = ((value * 100.0) / sum).round(2)
78
- }
79
- end
80
- return hash
81
- end; self.instance_eval { alias frequency_of base_composition } # === Bioroebe.frequency_of
82
-
83
- # ========================================================================= #
84
- # === Bioroebe.report_base_composition
85
- #
86
- # This is the convenience-method for reporting the base composition
87
- # at hand.
88
- # ========================================================================= #
89
- def self.report_base_composition(
90
- i = '52%GC'
91
- )
92
- if i.is_a? Array
93
- if i.empty?
94
- i = '52%GC' # Default value.
95
- else
96
- i = i.join(' ').strip
97
- end
98
- end
99
- hash = ::Bioroebe.base_composition(i)
100
- a = hash['A']
101
- t = hash['T']
102
- c = hash['C']
103
- g = hash['G']
104
- erev 'The base composition frequencies of this sequence '\
105
- '(length: '+i.size.to_s+') is as follows:'
106
- e
107
- e ' '\
108
- ' A: '+steelblue(a.to_s+'%')+rev+
109
- ' T: '+steelblue(t.to_s+'%')+rev+
110
- ' C: '+steelblue(c.to_s+'%')+rev+
111
- ' G: '+steelblue(g.to_s+'%')+rev
112
- e
113
- end; self.instance_eval { alias show_base_composition report_base_composition } # === show_base_composition
114
-
115
- end
116
-
117
- if __FILE__ == $PROGRAM_NAME
118
- pp Bioroebe.base_composition(ARGV)
119
- Bioroebe.report_base_composition(ARGV)
120
- end # basecomposition ATGC
121
- # basecomposition ATTGCCCCCCCCAACCCCACA
@@ -1,153 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/blast.rb'
6
- # =========================================================================== #
7
- module Bioroebe
8
-
9
- # ========================================================================= #
10
- # === Bioroebe.blast_neighborhood
11
- #
12
- # The second argument to this method is a score-filter, e. g. to
13
- # select only entries that have a score higher than 1.
14
- # ========================================================================= #
15
- def self.blast_neighborhood(
16
- this_mer = 'CTC',
17
- optional_apply_filter_for_score_higher_than = nil
18
- )
19
- require 'bioroebe/toplevel_methods/e.rb'
20
- if this_mer.is_a? Array
21
- this_mer = this_mer.first
22
- end
23
- if this_mer.nil?
24
- this_mer = 'CTC' # Set the same default as above.
25
- end
26
- match_score = 2
27
- mis_match_score = -2
28
- # ======================================================================= #
29
- # Next use an Array of sequences that we will compare.
30
- # ======================================================================= #
31
- compare_these_sequences = %w(
32
- AAA
33
- AAT
34
- AAC
35
- AAG
36
- ATA
37
- ATT
38
- ATC
39
- ATG
40
- ACA
41
- ACT
42
- ACC
43
- ACG
44
- AGA
45
- AGT
46
- AGC
47
- AGG
48
- TAA
49
- TAT
50
- TAC
51
- TAG
52
- TTA
53
- TTT
54
- TTC
55
- TTG
56
- TCA
57
- TCT
58
- TCC
59
- TCG
60
- TGA
61
- TGT
62
- TGC
63
- TGG
64
- CAA
65
- CAT
66
- CAC
67
- CAG
68
- CTA
69
- CTT
70
- CTC
71
- CTG
72
- CCA
73
- CCT
74
- CCC
75
- CCG
76
- CGA
77
- CGT
78
- CGC
79
- CGG
80
- GAA
81
- GAT
82
- GAC
83
- GAG
84
- GTA
85
- GTT
86
- GTC
87
- GTG
88
- GCA
89
- GCT
90
- GCC
91
- GCG
92
- GGA
93
- GGT
94
- GGC
95
- GGG
96
- )
97
- compare_these_sequences.each {|this_sequence|
98
- score = 0
99
- chars = this_sequence.chars
100
- first_char = chars[0]
101
- second_char = chars[1]
102
- third_char = chars[2]
103
- if first_char == this_mer[0]
104
- # =================================================================== #
105
- # Found the first match.
106
- # =================================================================== #
107
- score += match_score
108
- else
109
- # =================================================================== #
110
- # else it must be a mismatch
111
- # =================================================================== #
112
- score += mis_match_score
113
- end
114
- if second_char == this_mer[1]
115
- # =================================================================== #
116
- # Found the first match.
117
- # =================================================================== #
118
- score += match_score
119
- else
120
- # =================================================================== #
121
- # else it must be a mismatch
122
- # =================================================================== #
123
- score += mis_match_score
124
- end
125
- if third_char == this_mer[2]
126
- # =================================================================== #
127
- # Found the first match.
128
- # =================================================================== #
129
- score += match_score
130
- else
131
- # =================================================================== #
132
- # else it must be a mismatch
133
- # =================================================================== #
134
- score += mis_match_score
135
- end
136
- if optional_apply_filter_for_score_higher_than
137
- if (score.to_i > optional_apply_filter_for_score_higher_than)
138
- e "#{this_sequence}: score of "\
139
- "#{score.to_s.rjust(3)}"
140
- end
141
- else
142
- e this_sequence+': score of '+
143
- score.to_s.rjust(3)
144
- end
145
- }
146
- end
147
-
148
- end
149
-
150
- if __FILE__ == $PROGRAM_NAME
151
- # Bioroebe.blast_neighborhood(ARGV)
152
- Bioroebe.blast_neighborhood(ARGV, 1)
153
- end # rb blast_neighb*
@@ -1,57 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/calculate_n50_value.rb'
6
- # Bioroebe.calculate_n50_value(ARGV)
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- # ========================================================================= #
11
- # === Bioroebe.calculate_n50_value
12
- #
13
- # This method will calculate the N50 value of the given input. The input
14
- # to this method should be a sorted Array.
15
- # ========================================================================= #
16
- def self.calculate_n50_value(
17
- i = [
18
- 1989, 1934, 1841,
19
- 1785, 1737, 1649,
20
- 1361, 926, 848,
21
- 723
22
- ]
23
- )
24
- # ======================================================================= #
25
- # The following conversion is necessary because ARGV will contain only
26
- # String objects, not integer-values.
27
- # ======================================================================= #
28
- i.map! {|entry| entry.to_i }
29
- calculate_sum_for_the_loop = 0
30
- sum = i.sum
31
- half = sum / 2.0
32
- find_the_proper_contig = nil
33
- i.each {|this_number|
34
- calculate_sum_for_the_loop += this_number
35
- # ===================================================================== #
36
- # Compare the temporary sum with the half-sum.
37
- # ===================================================================== #
38
- if calculate_sum_for_the_loop > half
39
- find_the_proper_contig = this_number
40
- break
41
- end
42
- }
43
- return find_the_proper_contig
44
- end
45
-
46
- end
47
-
48
- if __FILE__ == $PROGRAM_NAME
49
- if ARGV.empty?
50
- pp Bioroebe.calculate_n50_value
51
- array_to_test = [1252, 919, 917, 765, 711, 690, 632, 516, 463, 218]
52
- pp array_to_test
53
- pp Bioroebe.calculate_n50_value(array_to_test)
54
- else
55
- pp Bioroebe.calculate_n50_value(ARGV)
56
- end
57
- end # calculaten50value
@@ -1,71 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/cat.rb'
6
- # =========================================================================== #
7
- module Bioroebe
8
-
9
- require 'bioroebe/toplevel_methods/convert_global_env.rb'
10
- require 'bioroebe/toplevel_methods/e.rb'
11
- require 'bioroebe/colours/colours.rb'
12
- require 'bioroebe/colours/rev.rb'
13
- require 'bioroebe/colours/sfile.rb'
14
- require 'bioroebe/colours/sdir.rb'
15
-
16
- # ========================================================================= #
17
- # === Bioroebe.cat (cat tag)
18
- #
19
- # A variant of cat to use here.
20
- # ========================================================================= #
21
- def self.cat(i = nil)
22
- if i
23
- i = convert_global_env(i) if i.include? '$'
24
- i = Dir['*'][i.to_i - 1] if i =~ /^\d+$/
25
- end
26
- if i.nil?
27
- erev 'Please provide an argument to Bioroebe.cat() (the name of a file)'
28
- # ======================================================================= #
29
- # === Handle directories next
30
- # ======================================================================= #
31
- elsif File.directory? i
32
- erev "We can not read from `#{sdir(i)}#{rev}` as it is a directory."
33
- # ======================================================================= #
34
- # Else the File will exist in this clause:
35
- # ======================================================================= #
36
- elsif File.exist?(i)
37
- _ = File.extname(i).delete('.')
38
- case _ # case tag
39
- # ===================================================================== #
40
- # === fasta
41
- # ===================================================================== #
42
- when 'fasta',
43
- 'fa'
44
- e 'This is a fasta file, so rather than cat-ing the content,'
45
- e 'we will send this dataset to the ParseFasta class.'
46
- require 'bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb'
47
- Bioroebe::ParseFasta.new(i)
48
- else # The default here.
49
- e "Now displaying the file `#{sfile(i)}`."
50
- # e File.read(i)
51
- # ^^^ Or we could use the above. We have to reconsider this one day.
52
- File.readlines(i).each {|line| e " #{line.chomp}" } # With a bit of padding.
53
- end
54
- else # else the file does not exist.
55
- e "#{swarn('Trying to display the file `')}#{sfile(i)}#{swarn('`')}"
56
- e swarn('but it does not exist.')
57
- end
58
- end
59
-
60
- # ========================================================================= #
61
- # === cat
62
- # ========================================================================= #
63
- def cat(i)
64
- ::Bioroebe.cat(i)
65
- end
66
-
67
- end
68
-
69
- if __FILE__ == $PROGRAM_NAME
70
- Bioroebe.cat '/etc/wgetrc' # This is just for testing purposes really.
71
- end # bioroebe_cat
@@ -1,92 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # This code will return a properly-chunked nucleotide sequence, with
6
- # numbers.
7
- #
8
- # The genbank format uses such a chunked display.
9
- #
10
- # The display will look similar to this:
11
- #
12
- #
13
- # 1 ATGGGGCCTG CAATGGGGCC TGCAATGGGG CCTGCAATGG GGCCTGCAAT GGGGCCTGCA
14
- # 61 ATGGGGCCTG CAATGGGGCC TGCAATGGGG CCTGCA
15
- #
16
- #
17
- # The chunks width defaults to the genbank format.
18
- # =========================================================================== #
19
- # require 'bioroebe/toplevel_methods/chunked_display.rb'
20
- # puts Bioroebe.chunked_display(ARGV, 10)
21
- # =========================================================================== #
22
- module Bioroebe
23
-
24
- require 'bioroebe/constants/newline.rb'
25
-
26
- # ========================================================================= #
27
- # === Bioroebe.return_nucleotide_sequence_as_ten_nucleotides_chunks
28
- # ========================================================================= #
29
- def self.return_nucleotide_sequence_as_ten_nucleotides_chunks(i)
30
- i.split(/(.{10})/).reject(&:empty?)
31
- end
32
-
33
- # ========================================================================= #
34
- # === Bioroebe.return_chunked_display
35
- #
36
- # The second argument to this method tells us how many nucleotides
37
- # shall be grouped together (and then displayed as such).
38
- # ========================================================================= #
39
- def self.return_chunked_display(
40
- i,
41
- group_together_n_nucleotides = 10
42
- )
43
- i = i.first if i.is_a? Array
44
- chunks = i.split(/(.{#{group_together_n_nucleotides}})/).reject(&:empty?)
45
- sliced = chunks.each_slice(6).to_a
46
- _ = ''.dup # We need a dynamic String.
47
- sliced.each {|array|
48
- # ===================================================================== #
49
- # First, add the number to the beginning.
50
- # ===================================================================== #
51
- nucleotide_position = (
52
- _.strip.tr(' ','').tr(N,'').gsub(/\d/,'').strip.size + 1
53
- ).to_s
54
- _ << nucleotide_position.rjust(9)+' '
55
- _ << array.join(' ')
56
- _ << N
57
- }
58
- return _
59
- end; self.instance_eval { alias chunked_display return_chunked_display } # === Bioroebe.chunked_display
60
-
61
- # ========================================================================= #
62
- # === Bioroebe.downcase_chunked_display
63
- #
64
- # This is similar to the regular chunked display, but will return
65
- # the nucleotides in a downcased manner, aka "A" will become "a"
66
- # and so forth.
67
- #
68
- # In the past this functionality resided in its own .rb file, but
69
- # since as of March 2020 a bin/ executable was added, so that
70
- # the functionality can be more easily called when the bioroebe
71
- # gem is installed.
72
- #
73
- # Usage example:
74
- #
75
- # Bioroebe.downcase_chunked_display 'ATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCA'
76
- #
77
- # ========================================================================= #
78
- def self.downcase_chunked_display(
79
- i,
80
- group_together_n_nucleotides = 10
81
- )
82
- sequence = ::Bioroebe.return_chunked_display(i, group_together_n_nucleotides).downcase
83
- return sequence
84
- end
85
-
86
- end
87
-
88
- if __FILE__ == $PROGRAM_NAME
89
- puts Bioroebe.chunked_display(ARGV, 10)
90
- puts Bioroebe.downcase_chunked_display(ARGV, 10)
91
- end # chunkeddisplay ATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCA
92
- # downcasechunkeddisplay ATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCA