Module: BioRdf::Parsers::BroadGSEA::Parser
- Includes:
- Bio::Log
- Defined in:
- lib/bio-rdf/parsers/gsea/broadgsea.rb
Class Method Summary collapse
Class Method Details
.do_parse(input, filter, output) ⇒ Object
129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 |
# File 'lib/bio-rdf/parsers/gsea/broadgsea.rb', line 129 def Parser::do_parse input, filter, output log = LoggerPlus.new 'gsea' log.level = INFO log.outputters = Outputter.stderr log.warn("Fetching "+input) print "Marker\tGenotype\tGS\tSIZE\tSOURCE\tES\tNES\tNOM p-val\tFDR q-val\tFWER p-val\tTag \%\tGene \%\tSignal\tFDR (median)\tglob.p.val\n" Dir.foreach(input) do |entry| # two step search, because of many dirs next if entry == '.' or entry == '..' log.info("Parsing directory "+entry) clsfilename = File.join(input,entry,"*cls") clsfilename = Dir.glob(clsfilename) raise "We need one cls file: #{clsfilename}" if clsfilename.size != 1 clsfilename = clsfilename[0] # log.info(resultfilenames) resultfilenames = File.join(input,entry,"*SUMMARY.RESULTS.REPORT.[01].txt") Dir.glob(resultfilenames) do |fn| genotype = "A" genotype = "B" if fn =~ /1.txt/ marker = "unknown" # fetch marker name if File.exist?(clsfilename) cls = BioRdf::Parsers::BroadGSEA::ParseClsRecord.new(File.read(clsfilename)) marker = cls.classnames[0] end gsea_results = BioRdf::Parsers::BroadGSEA::ParseResultFile.new(fn) recs = gsea_results.find_all { | rec | rec.fdr_q_value <= 0.25 } recs.each do | rec | print "#{marker}\t#{genotype}\t"+rec.to_list.join("\t"),"\n" end end end end |
.handle_options ⇒ Object
98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 |
# File 'lib/bio-rdf/parsers/gsea/broadgsea.rb', line 98 def Parser:: = OpenStruct.new() opts = OptionParser.new() do |o| o. = "Usage: #{File.basename($0)} gsea [options] dir" o.on_tail("-h", "--help", "Show help and examples") { print(o) exit() } o.on("-e filter","--exec filter",String, "Execute filter") do |s| .exec = s end o.on("--tabulate","Output tab delimited table") do .output = :tabulate end end opts.parse!(ARGV) dir = ARGV[0] if dir and File.directory?(dir) do_parse(dir, .exec, .output) else raise "you should supply a GSEA directory!" end end |