Class: Bioroebe::ShowFastaHeaders

Inherits:
CommandlineApplication show all
Defined in:
lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb

Overview

Biroebe::ShowFastaHeaders

Constant Summary collapse

NAMESPACE =
#

NAMESPACE

#
inspect
BASE_DIR =
#

BASE_DIR

This base-directory will only work on my home setup, by default.

#
'/home/x/data/science/bioinformatics/data/fasta/'

Constants inherited from CommandlineApplication

CommandlineApplication::OLD_VERBOSE_VALUE

Constants included from ColoursForBase

ColoursForBase::ARRAY_HTML_COLOURS_IN_USE

Instance Method Summary collapse

Methods inherited from CommandlineApplication

#all_aminoacids?, #append_what_into, #at_home?, #be_silent, #be_verbose?, #cat, #ccliner, #change_directory, #cliner, #codon_table_dataset?, #codon_to_aminoacid, #codons_for?, #colourize_this_dna_sequence, #complement, #cp, #disable_warnings, #download_dir?, #editor?, #enable_warnings, #ensure_that_the_base_directories_exist, #esystem, #extract, #is_this_a_start_codon?, #is_this_a_stop_codon?, #leading_five_prime, #load_bioroebe_yaml_file, #log_directory?, #one_letter_to_long_name, #one_to_three, #only_numbers?, #open_in_browser, #opne, #opnn, #pad_with_double_quotes, #pad_with_single_quotes, #partner_nucleotide, #remove_numbers, #remove_trailing_ansii_escape_code, #return_all_possible_start_codons, #return_array_of_one_letter_aminoacids, #return_cheerful_person, #return_chunked_display, #return_ubiquitin_sequence, #set_be_verbose, #start_codon?, #stop_codons?, #strict_filter_away_invalid_aminoacids, #taxonomy_download_directory?, #three_to_one, #to_rna, #trailing_three_prime, #use_opn?, #verbose_truth, #was_or_were, #without_extname, #write_what_into

Methods included from CommandlineArguments

#commandline_arguments?, #commandline_arguments_that_are_files?, #e, #first?, #first_non_hyphen_argument?, #remove_hyphens_from_the_commandline_arguments, #return_commandline_arguments_as_string, #return_commandline_arguments_that_are_not_files, #return_entries_without_two_leading_hyphens, #select_commandline_arguments, #select_entries_starting_with_two_hyphens, #set_commandline_arguments

Methods included from ColoursForBase

#colourize_this_aminoacid_sequence_for_the_commandline, #colourize_this_nucleotide_sequence, #disable_colours, #ecomment, #efancy, #egold, #enable_colours, #eorange, #eparse, #erev, #red, #remove_trailing_escape_part, #return_colour_for_nucleotides, #rev, #sdir, #set_use_colours, #sfancy, #sfile, #simp, #swarn, #use_colours?, #use_colours_within_the_bioroebe_namespace?

Methods inherited from Base

#append_what_into, #can_base_pair?, #convert_global_env, #delete_file, #directory_to_the_codon_tables?, #file_readlines, #infer_the_namespace, #is_on_roebe?, #is_palindrome?, #main_encoding?, #mkdir, #move_file, #mv, #namespace?, #no_file_exists_at, #no_newlines, #project_yaml_directory?, #rds, #register_sigint, #return_pwd, #return_the_first_line_of_this_file, #word_wrap, #write_what_into

Constructor Details

#initialize(i = BASE_DIR, run_already = true) ⇒ ShowFastaHeaders

#

initialize

#

38
39
40
41
42
43
44
45
# File 'lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb', line 38

def initialize(
    i           = BASE_DIR,
    run_already = true
  )
  reset
  set_input(i)
  run if run_already
end

Instance Method Details

#input?Boolean

#

input?

#

Returns:

  • (Boolean)

85
86
87
# File 'lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb', line 85

def input?
  @input
end

#input_without_extensionObject

#

input_without_extension

#

92
93
94
# File 'lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb', line 92

def input_without_extension
  input?.sub(/\*\.ffn$/,'')
end

#report_these_files(files) ⇒ Object

#

report_these_files

#

99
100
101
102
103
104
105
106
# File 'lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb', line 99

def report_these_files(files)
  files.each {|this_file|
    dataset = File.readlines(this_file)
    dataset.reject! {|line| line.strip.start_with? '#' }
    header = dataset.first
    report_this_header_from_that_file(header, this_file)
  }
end

#report_this_header_from_that_file(header, file) ⇒ Object

#

report_this_header_from_that_file

#

111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
# File 'lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb', line 111

def report_this_header_from_that_file(header, file)
  if @be_verbose
    erev "The file at #{sfile(file)}#{rev} has the following FASTA header:"
    e
  end
  e "  #{simp(header)}"
  if header.include? '|'
    splitted = header.split('|')
    if splitted.size > 2
      assumed_name_of_the_organism = splitted[2].strip
      if assumed_name_of_the_organism.include? 'OS='
        assumed_name_of_the_organism = assumed_name_of_the_organism.scan(/ OS=(.+)/).flatten
        assumed_name_of_the_organism = assumed_name_of_the_organism.first
        if assumed_name_of_the_organism.include? ' ('
          assumed_name_of_the_organism = assumed_name_of_the_organism.split(' (').first
        end
      end
      erev 'The organism may be: '+
           steelblue(assumed_name_of_the_organism)+rev
    end
  end
end

#resetObject

#

reset (reset tag)

#

50
51
52
53
54
55
56
57
58
59
60
# File 'lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb', line 50

def reset
  super()
  # ======================================================================= #
  # === @be_verbose
  # ======================================================================= #
  @be_verbose = true
  # ======================================================================= #
  # === @namespace
  # ======================================================================= #
  @namespace = NAMESPACE
end

#runObject

#

run (run tag)

#

137
138
139
140
141
142
143
144
# File 'lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb', line 137

def run
  files = Dir[input?]
  if files.empty?
    opnn; e "No files could be found for #{input?}."
  else
    report_these_files(files)
  end
end

#set_input(i = '') ⇒ Object

#

set_input

#

65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
# File 'lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb', line 65

def set_input(i = '')
  i = i.first if i.is_a? Array
  i = i.to_s.dup
  if i.empty?
    i = BASE_DIR
  end
  i = i.dup if i.frozen?
  if i.end_with?('/') and !File.directory?(i) # Reject invalid directories here.
    i.chop!
  end
  if File.directory? i
    i << '/*.ffn'
  end
  i.squeeze!('/')
  @input = i
end